In [1]:
from pathlib import Path
from docling.document_converter import DocumentConverter

def _write_text_atomic(target, text):
    """Write ``text`` to ``target`` (UTF-8) via a temporary sibling file.

    The final path only appears once the content is fully written, so an
    interrupted or failed write can never leave a truncated file behind that
    a later run would mistake for a finished conversion.
    """
    tmp_path = target.with_name(target.name + ".tmp")
    try:
        tmp_path.write_text(text, encoding="utf-8")
        tmp_path.replace(target)
    finally:
        # After a successful replace the temp file no longer exists; on
        # failure, remove the partial temp file so it does not linger.
        if tmp_path.exists():
            tmp_path.unlink()


def process_files(crawl_dir, processed_dir):
    """Convert every file directly inside ``crawl_dir`` to Markdown.

    Each regular file is passed to a docling ``DocumentConverter`` and the
    exported Markdown is written to ``processed_dir/<input stem>.md``.
    Inputs whose output file already exists are skipped, so the function can
    be re-run to resume an interrupted batch. A failure on one file is
    printed and counted; it does not stop the remaining files.

    Args:
        crawl_dir: Directory containing the downloaded source documents
            (str or path-like). Only its direct children are considered.
        processed_dir: Directory receiving the ``.md`` files; created
            (including parents) if it does not exist.

    Returns:
        None. Progress and a final summary are printed to stdout.
    """
    input_path = Path(crawl_dir)
    processed_path = Path(processed_dir)
    processed_path.mkdir(parents=True, exist_ok=True)

    # glob('*') also yields sub-directories; keep regular files only and sort
    # them so the processing order does not depend on the filesystem.
    input_files = sorted(p for p in input_path.glob('*') if p.is_file())
    print(f"Found {len(input_files)} files to process in {input_path}")

    # NOTE(review): docling appears to expect `format_options` to be keyed by
    # InputFormat members with FormatOption values; the string key below may
    # be silently ignored. Confirm against the installed docling version.
    converter = DocumentConverter(format_options={"preserve_links": True})

    files_processed = 0
    errors = 0

    for input_file in input_files:
        md_file_name = processed_path / f"{input_file.stem}.md"

        if md_file_name.exists():
            print(f"Skipping '{input_file.name}' — already processed.")
            continue

        try:
            result = converter.convert(input_file)
            markdown_content = result.document.export_to_markdown()
            _write_text_atomic(md_file_name, markdown_content)
        except Exception as e:
            # Best effort: report the failure and carry on with the batch.
            errors += 1
            print(f"Error processing {input_file}: {e}")
        else:
            print(f"Converted '{input_file}' --> '{md_file_name}'")
            files_processed += 1

    print(f"Processed {files_processed} new files. Errors: {errors}")

  from .autonotebook import tqdm as notebook_tqdm


In [None]:
# Process the EDGAR documents: every sub-folder of `crawl_dir` (one per
# ticker) is converted into a folder of the same name under `processed_dir`.
import os

crawl_dir = 'data/edgar_documents'
processed_dir = 'data/processed_data'

# os.listdir() returns entries in an unspecified order; sort them so the run
# (and its log output) is reproducible across platforms.
entries = sorted(os.listdir(crawl_dir))

# Keep directories only; stray files next to the ticker folders are ignored.
ticker_folders = [
    entry for entry in entries
    if os.path.isdir(os.path.join(crawl_dir, entry))
]
print(ticker_folders)

for folder in ticker_folders:
    full_path = os.path.join(crawl_dir, folder)
    output_dir = os.path.join(processed_dir, folder)
    process_files(crawl_dir=full_path, processed_dir=output_dir)



2025-11-14 15:25:15,781 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:15,782 - ERROR - Input document 4_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:15,786 - INFO - Going to convert document batch...
2025-11-14 15:25:15,794 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:15,795 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

['AAPL', 'ABBV', 'ABT', 'ACN', 'ADBE', 'AIG', 'AMD', 'AMGN', 'AMT', 'AMZN', 'AVGO', 'AXP', 'BA', 'BK', 'BKNG', 'BLK', 'BMY', 'BRK-B', 'CAT', 'CHTR', 'CL', 'CMCSA', 'COF', 'COP', 'COST', 'CRM', 'CSCO', 'CVS', 'CVX', 'DE', 'DHR', 'DIS', 'DUK', 'EMR', 'FDX', 'GD', 'GE', 'GILD', 'GM', 'GOOGL', 'HD', 'HON', 'IBM', 'INTC', 'INTU', 'ISRG', 'JNJ', 'KO', 'LIN', 'LLY', 'LMT', 'LOW', 'MA', 'MCD', 'MDLZ', 'MDT', 'MET', 'META', 'MMM', 'MO', 'MRK', 'MSFT', 'NEE', 'NFLX', 'NKE', 'NOW', 'NVDA', 'ORCL', 'PEP', 'PFE', 'PG', 'PLTR', 'PM', 'PYPL', 'QCOM', 'RTX', 'SBUX', 'SCHW', 'SO', 'SPG', 'T', 'TGT', 'TMO', 'TMUS', 'TSLA', 'TXN', 'UNH', 'UNP', 'UPS', 'USB', 'V', 'VZ', 'WFC', 'WMT', 'XOM']
Found 91 files to process in data\edgar_documents\AAPL
Skipping '10-K_2023-11-03' — already processed.
Skipping '10-K_2024-11-01' — already processed.
Skipping '10-K_2025-10-31' — already processed.
Skipping '10-Q_2023-02-03' — already processed.
Skipping '10-Q_2023-05-05' — already processed.
Skipping '10-Q_2023-08-04

2025-11-14 15:25:15,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:17,062 - INFO - Going to convert document batch...
2025-11-14 15:25:17,062 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:25:17,063 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:25:19,639 - INFO - Finished converting document 10-K_2023-02-17 in 3.77 sec.
2025-11-14 15:25:20,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2023-02-17' --> 'data\processed_data\ABBV\10-K_2023-02-17.md'


2025-11-14 15:25:21,470 - INFO - Going to convert document batch...
2025-11-14 15:25:21,473 - INFO - Processing document 10-K_2024-02-20
2025-11-14 15:25:23,983 - INFO - Finished converting document 10-K_2024-02-20 in 3.64 sec.
2025-11-14 15:25:24,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2024-02-20' --> 'data\processed_data\ABBV\10-K_2024-02-20.md'


2025-11-14 15:25:26,098 - INFO - Going to convert document batch...
2025-11-14 15:25:26,099 - INFO - Processing document 10-K_2025-02-14
2025-11-14 15:25:29,061 - INFO - Finished converting document 10-K_2025-02-14 in 4.34 sec.
2025-11-14 15:25:29,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2025-02-14' --> 'data\processed_data\ABBV\10-K_2025-02-14.md'


2025-11-14 15:25:30,634 - INFO - Going to convert document batch...
2025-11-14 15:25:30,636 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:25:31,436 - INFO - Finished converting document 10-Q_2023-05-05 in 1.64 sec.
2025-11-14 15:25:31,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-05-05' --> 'data\processed_data\ABBV\10-Q_2023-05-05.md'


2025-11-14 15:25:32,343 - INFO - Going to convert document batch...
2025-11-14 15:25:32,344 - INFO - Processing document 10-Q_2023-08-07
2025-11-14 15:25:33,323 - INFO - Finished converting document 10-Q_2023-08-07 in 1.52 sec.
2025-11-14 15:25:33,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-08-07' --> 'data\processed_data\ABBV\10-Q_2023-08-07.md'


2025-11-14 15:25:34,706 - INFO - Going to convert document batch...
2025-11-14 15:25:34,707 - INFO - Processing document 10-Q_2023-11-06
2025-11-14 15:25:35,689 - INFO - Finished converting document 10-Q_2023-11-06 in 1.98 sec.
2025-11-14 15:25:36,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-11-06' --> 'data\processed_data\ABBV\10-Q_2023-11-06.md'


2025-11-14 15:25:36,862 - INFO - Going to convert document batch...
2025-11-14 15:25:36,864 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:25:37,746 - INFO - Finished converting document 10-Q_2024-05-03 in 1.67 sec.
2025-11-14 15:25:38,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-05-03' --> 'data\processed_data\ABBV\10-Q_2024-05-03.md'


2025-11-14 15:25:38,617 - INFO - Going to convert document batch...
2025-11-14 15:25:38,617 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:25:40,009 - INFO - Finished converting document 10-Q_2024-08-07 in 1.89 sec.
2025-11-14 15:25:40,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-08-07' --> 'data\processed_data\ABBV\10-Q_2024-08-07.md'


2025-11-14 15:25:40,951 - INFO - Going to convert document batch...
2025-11-14 15:25:40,951 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 15:25:42,025 - INFO - Finished converting document 10-Q_2024-11-04 in 1.59 sec.
2025-11-14 15:25:42,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-11-04' --> 'data\processed_data\ABBV\10-Q_2024-11-04.md'


2025-11-14 15:25:43,210 - INFO - Going to convert document batch...
2025-11-14 15:25:43,211 - INFO - Processing document 10-Q_2025-05-09
2025-11-14 15:25:44,026 - INFO - Finished converting document 10-Q_2025-05-09 in 1.58 sec.
2025-11-14 15:25:44,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2025-05-09' --> 'data\processed_data\ABBV\10-Q_2025-05-09.md'


2025-11-14 15:25:45,221 - INFO - Going to convert document batch...
2025-11-14 15:25:45,222 - INFO - Processing document 10-Q_2025-08-04
2025-11-14 15:25:46,207 - INFO - Finished converting document 10-Q_2025-08-04 in 1.81 sec.
2025-11-14 15:25:46,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2025-08-04' --> 'data\processed_data\ABBV\10-Q_2025-08-04.md'


2025-11-14 15:25:47,215 - INFO - Going to convert document batch...
2025-11-14 15:25:47,216 - INFO - Processing document 10-Q_2025-11-04
2025-11-14 15:25:48,605 - INFO - Finished converting document 10-Q_2025-11-04 in 2.00 sec.
2025-11-14 15:25:49,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,051 - INFO - Going to convert document batch...
2025-11-14 15:25:49,051 - INFO - Processing document 4_2023-01-03
2025-11-14 15:25:49,070 - INFO - Finished converting document 4_2023-01-03 in 0.03 sec.
2025-11-14 15:25:49,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,119 - INFO - Going to convert document batch...
2025-11-14 15:25:49,119 - INFO - Processing document 4_2023-02-21
2025-11-14 15:25:49,136 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 15:25:49,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,194 - INFO - Going to convert document batch...
2025-11-14 15:25:49,

Converted 'data\edgar_documents\ABBV\10-Q_2025-11-04' --> 'data\processed_data\ABBV\10-Q_2025-11-04.md'
Converted 'data\edgar_documents\ABBV\4_2023-01-03' --> 'data\processed_data\ABBV\4_2023-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2023-02-21' --> 'data\processed_data\ABBV\4_2023-02-21.md'


2025-11-14 15:25:49,217 - INFO - Finished converting document 4_2023-02-22 in 0.06 sec.
2025-11-14 15:25:49,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,261 - INFO - Going to convert document batch...
2025-11-14 15:25:49,262 - INFO - Processing document 4_2023-03-02
2025-11-14 15:25:49,280 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 15:25:49,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,341 - INFO - Going to convert document batch...
2025-11-14 15:25:49,342 - INFO - Processing document 4_2023-03-07
2025-11-14 15:25:49,362 - INFO - Finished converting document 4_2023-03-07 in 0.06 sec.
2025-11-14 15:25:49,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,424 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-02-22' --> 'data\processed_data\ABBV\4_2023-02-22.md'
Converted 'data\edgar_documents\ABBV\4_2023-03-02' --> 'data\processed_data\ABBV\4_2023-03-02.md'
Converted 'data\edgar_documents\ABBV\4_2023-03-07' --> 'data\processed_data\ABBV\4_2023-03-07.md'


2025-11-14 15:25:49,425 - INFO - Processing document 4_2023-03-15
2025-11-14 15:25:49,449 - INFO - Finished converting document 4_2023-03-15 in 0.08 sec.
2025-11-14 15:25:49,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,492 - INFO - Going to convert document batch...
2025-11-14 15:25:49,495 - INFO - Processing document 4_2023-04-04
2025-11-14 15:25:49,519 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 15:25:49,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,584 - INFO - Going to convert document batch...
2025-11-14 15:25:49,584 - INFO - Processing document 4_2023-04-05
2025-11-14 15:25:49,605 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 15:25:49,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,656 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-03-15' --> 'data\processed_data\ABBV\4_2023-03-15.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-04' --> 'data\processed_data\ABBV\4_2023-04-04.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-05' --> 'data\processed_data\ABBV\4_2023-04-05.md'


2025-11-14 15:25:49,656 - INFO - Processing document 4_2023-04-19
2025-11-14 15:25:49,677 - INFO - Finished converting document 4_2023-04-19 in 0.05 sec.
2025-11-14 15:25:49,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,724 - INFO - Going to convert document batch...
2025-11-14 15:25:49,725 - INFO - Processing document 4_2023-04-27
2025-11-14 15:25:49,746 - INFO - Finished converting document 4_2023-04-27 in 0.05 sec.
2025-11-14 15:25:49,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,810 - INFO - Going to convert document batch...
2025-11-14 15:25:49,812 - INFO - Processing document 4_2023-05-02
2025-11-14 15:25:49,833 - INFO - Finished converting document 4_2023-05-02 in 0.06 sec.
2025-11-14 15:25:49,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,879 - INFO - Going to convert document batch...
2025-11-14 15:25:49,880 - INFO - Processing document 4_2023-05-09
2025-11-14 15:25:49,899 - IN

Converted 'data\edgar_documents\ABBV\4_2023-04-19' --> 'data\processed_data\ABBV\4_2023-04-19.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-27' --> 'data\processed_data\ABBV\4_2023-04-27.md'
Converted 'data\edgar_documents\ABBV\4_2023-05-02' --> 'data\processed_data\ABBV\4_2023-05-02.md'


2025-11-14 15:25:49,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,947 - INFO - Going to convert document batch...
2025-11-14 15:25:49,948 - INFO - Processing document 4_2023-05-12
2025-11-14 15:25:49,966 - INFO - Finished converting document 4_2023-05-12 in 0.05 sec.
2025-11-14 15:25:50,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,012 - INFO - Going to convert document batch...
2025-11-14 15:25:50,013 - INFO - Processing document 4_2023-07-05
2025-11-14 15:25:50,035 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 15:25:50,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,105 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-05-09' --> 'data\processed_data\ABBV\4_2023-05-09.md'
Converted 'data\edgar_documents\ABBV\4_2023-05-12' --> 'data\processed_data\ABBV\4_2023-05-12.md'
Converted 'data\edgar_documents\ABBV\4_2023-07-05' --> 'data\processed_data\ABBV\4_2023-07-05.md'


2025-11-14 15:25:50,106 - INFO - Processing document 4_2023-08-02
2025-11-14 15:25:50,155 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.
2025-11-14 15:25:50,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,202 - INFO - Going to convert document batch...
2025-11-14 15:25:50,203 - INFO - Processing document 4_2023-09-11
2025-11-14 15:25:50,220 - INFO - Finished converting document 4_2023-09-11 in 0.03 sec.
2025-11-14 15:25:50,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,279 - INFO - Going to convert document batch...
2025-11-14 15:25:50,280 - INFO - Processing document 4_2023-09-27
2025-11-14 15:25:50,302 - INFO - Finished converting document 4_2023-09-27 in 0.06 sec.
2025-11-14 15:25:50,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,342 - INFO - Going to convert document batch...
2025-11-14 15:25:50,343 - INFO - Processing document 4_2023-10-03
2025-11-14 15:25:50,363 - IN

Converted 'data\edgar_documents\ABBV\4_2023-08-02' --> 'data\processed_data\ABBV\4_2023-08-02.md'
Converted 'data\edgar_documents\ABBV\4_2023-09-11' --> 'data\processed_data\ABBV\4_2023-09-11.md'
Converted 'data\edgar_documents\ABBV\4_2023-09-27' --> 'data\processed_data\ABBV\4_2023-09-27.md'
Converted 'data\edgar_documents\ABBV\4_2023-10-03' --> 'data\processed_data\ABBV\4_2023-10-03.md'


2025-11-14 15:25:50,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,428 - INFO - Going to convert document batch...
2025-11-14 15:25:50,429 - INFO - Processing document 4_2023-12-28
2025-11-14 15:25:50,450 - INFO - Finished converting document 4_2023-12-28 in 0.06 sec.
2025-11-14 15:25:50,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,491 - INFO - Going to convert document batch...
2025-11-14 15:25:50,491 - INFO - Processing document 4_2024-01-03
2025-11-14 15:25:50,513 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:25:50,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,555 - INFO - Going to convert document batch...
2025-11-14 15:25:50,556 - INFO - Processing document 4_2024-02-06
2025-11-14 15:25:50,578 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 15:25:50,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\4_2023-12-28' --> 'data\processed_data\ABBV\4_2023-12-28.md'
Converted 'data\edgar_documents\ABBV\4_2024-01-03' --> 'data\processed_data\ABBV\4_2024-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2024-02-06' --> 'data\processed_data\ABBV\4_2024-02-06.md'


2025-11-14 15:25:50,719 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:50,720 - ERROR - Input document 4_2024-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:50,721 - INFO - Going to convert document batch...
2025-11-14 15:25:50,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,744 - INFO - Going to convert document batch...
2025-11-14 15:25:50,745 - INFO - Processing document 4_2024-02-23
2025-11-14 15:25:50,768 - INFO - Fin

Converted 'data\edgar_documents\ABBV\4_2024-02-20' --> 'data\processed_data\ABBV\4_2024-02-20.md'
Error processing data\edgar_documents\ABBV\4_2024-02-21: File format not allowed: data\edgar_documents\ABBV\4_2024-02-21
Converted 'data\edgar_documents\ABBV\4_2024-02-23' --> 'data\processed_data\ABBV\4_2024-02-23.md'
Error processing data\edgar_documents\ABBV\4_2024-02-26: File format not allowed: data\edgar_documents\ABBV\4_2024-02-26


2025-11-14 15:25:50,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,917 - INFO - Going to convert document batch...
2025-11-14 15:25:50,918 - INFO - Processing document 4_2024-02-29
2025-11-14 15:25:50,937 - INFO - Finished converting document 4_2024-02-29 in 0.05 sec.
2025-11-14 15:25:50,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,002 - INFO - Going to convert document batch...
2025-11-14 15:25:51,003 - INFO - Processing document 4_2024-03-01
2025-11-14 15:25:51,026 - INFO - Finished converting document 4_2024-03-01 in 0.08 sec.
2025-11-14 15:25:51,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,074 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2024-02-27' --> 'data\processed_data\ABBV\4_2024-02-27.md'
Converted 'data\edgar_documents\ABBV\4_2024-02-29' --> 'data\processed_data\ABBV\4_2024-02-29.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-01' --> 'data\processed_data\ABBV\4_2024-03-01.md'


2025-11-14 15:25:51,075 - INFO - Processing document 4_2024-03-05
2025-11-14 15:25:51,102 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:25:51,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,149 - INFO - Going to convert document batch...
2025-11-14 15:25:51,149 - INFO - Processing document 4_2024-03-20
2025-11-14 15:25:51,175 - INFO - Finished converting document 4_2024-03-20 in 0.05 sec.
2025-11-14 15:25:51,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,221 - INFO - Going to convert document batch...
2025-11-14 15:25:51,221 - INFO - Processing document 4_2024-03-22
2025-11-14 15:25:51,237 - INFO - Finished converting document 4_2024-03-22 in 0.03 sec.
2025-11-14 15:25:51,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,299 - INFO - Going to convert document batch...
2025-11-14 15:25:51,300 - INFO - Processing document 4_2024-04-02
2025-11-14 15:25:51,317 - IN

Converted 'data\edgar_documents\ABBV\4_2024-03-05' --> 'data\processed_data\ABBV\4_2024-03-05.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-20' --> 'data\processed_data\ABBV\4_2024-03-20.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-22' --> 'data\processed_data\ABBV\4_2024-03-22.md'


2025-11-14 15:25:51,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,358 - INFO - Going to convert document batch...
2025-11-14 15:25:51,359 - INFO - Processing document 4_2024-05-07
2025-11-14 15:25:51,381 - INFO - Finished converting document 4_2024-05-07 in 0.05 sec.
2025-11-14 15:25:51,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,421 - INFO - Going to convert document batch...
2025-11-14 15:25:51,421 - INFO - Processing document 4_2024-07-02
2025-11-14 15:25:51,439 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 15:25:51,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,484 - INFO - Going to convert document batch...
2025-11-14 15:25:51,485 - INFO - Processing document 4_2024-07-19
2025-11-14 15:25:51,517 - INFO - Finished converting document 4_2024-07-19 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\4_2024-04-02' --> 'data\processed_data\ABBV\4_2024-04-02.md'
Converted 'data\edgar_documents\ABBV\4_2024-05-07' --> 'data\processed_data\ABBV\4_2024-05-07.md'
Converted 'data\edgar_documents\ABBV\4_2024-07-02' --> 'data\processed_data\ABBV\4_2024-07-02.md'


2025-11-14 15:25:51,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,579 - INFO - Going to convert document batch...
2025-11-14 15:25:51,580 - INFO - Processing document 4_2024-08-07
2025-11-14 15:25:51,602 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.
2025-11-14 15:25:51,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,642 - INFO - Going to convert document batch...
2025-11-14 15:25:51,642 - INFO - Processing document 4_2024-09-30
2025-11-14 15:25:51,661 - INFO - Finished converting document 4_2024-09-30 in 0.03 sec.
2025-11-14 15:25:51,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,700 - INFO - Going to convert document batch...
2025-11-14 15:25:51,701 - INFO - Processing document 4_2024-10-02
2025-11-14 15:25:51,719 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2024-07-19' --> 'data\processed_data\ABBV\4_2024-07-19.md'
Converted 'data\edgar_documents\ABBV\4_2024-08-07' --> 'data\processed_data\ABBV\4_2024-08-07.md'
Converted 'data\edgar_documents\ABBV\4_2024-09-30' --> 'data\processed_data\ABBV\4_2024-09-30.md'
Converted 'data\edgar_documents\ABBV\4_2024-10-02' --> 'data\processed_data\ABBV\4_2024-10-02.md'


2025-11-14 15:25:51,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,782 - INFO - Going to convert document batch...
2025-11-14 15:25:51,783 - INFO - Processing document 4_2024-12-18
2025-11-14 15:25:51,802 - INFO - Finished converting document 4_2024-12-18 in 0.06 sec.
2025-11-14 15:25:51,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,841 - INFO - Going to convert document batch...
2025-11-14 15:25:51,842 - INFO - Processing document 4_2025-01-03
2025-11-14 15:25:51,862 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:25:51,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,902 - INFO - Going to convert document batch...
2025-11-14 15:25:51,903 - INFO - Processing document 4_2025-02-07
2025-11-14 15:25:51,928 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 15:25:51,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\4_2024-12-18' --> 'data\processed_data\ABBV\4_2024-12-18.md'
Converted 'data\edgar_documents\ABBV\4_2025-01-03' --> 'data\processed_data\ABBV\4_2025-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2025-02-07' --> 'data\processed_data\ABBV\4_2025-02-07.md'


2025-11-14 15:25:52,047 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:52,048 - ERROR - Input document 4_2025-02-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:52,050 - INFO - Going to convert document batch...
2025-11-14 15:25:52,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,071 - INFO - Going to convert document batch...
2025-11-14 15:25:52,072 - INFO - Processing document 4_2025-02-24
2025-11-14 15:25:52,090 - INFO - Fin

Converted 'data\edgar_documents\ABBV\4_2025-02-18' --> 'data\processed_data\ABBV\4_2025-02-18.md'
Error processing data\edgar_documents\ABBV\4_2025-02-20: File format not allowed: data\edgar_documents\ABBV\4_2025-02-20
Converted 'data\edgar_documents\ABBV\4_2025-02-24' --> 'data\processed_data\ABBV\4_2025-02-24.md'
Converted 'data\edgar_documents\ABBV\4_2025-02-28' --> 'data\processed_data\ABBV\4_2025-02-28.md'


2025-11-14 15:25:52,204 - INFO - Processing document 4_2025-03-04
2025-11-14 15:25:52,222 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 15:25:52,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,259 - INFO - Going to convert document batch...
2025-11-14 15:25:52,260 - INFO - Processing document 4_2025-03-18
2025-11-14 15:25:52,277 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 15:25:52,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,349 - INFO - Going to convert document batch...
2025-11-14 15:25:52,349 - INFO - Processing document 4_2025-04-02
2025-11-14 15:25:52,368 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 15:25:52,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,409 - INFO - Going to convert document batch...
2025-11-14 15:25:52,410 - INFO - Processing document 4_2025-05-13
2025-11-14 15:25:52,429 - IN

Converted 'data\edgar_documents\ABBV\4_2025-03-04' --> 'data\processed_data\ABBV\4_2025-03-04.md'
Converted 'data\edgar_documents\ABBV\4_2025-03-18' --> 'data\processed_data\ABBV\4_2025-03-18.md'
Converted 'data\edgar_documents\ABBV\4_2025-04-02' --> 'data\processed_data\ABBV\4_2025-04-02.md'


2025-11-14 15:25:52,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,469 - INFO - Going to convert document batch...
2025-11-14 15:25:52,471 - INFO - Processing document 4_2025-07-02
2025-11-14 15:25:52,491 - INFO - Finished converting document 4_2025-07-02 in 0.03 sec.
2025-11-14 15:25:52,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,555 - INFO - Going to convert document batch...
2025-11-14 15:25:52,556 - INFO - Processing document 4_2025-08-07
2025-11-14 15:25:52,577 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.
2025-11-14 15:25:52,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,620 - INFO - Going to convert document batch...
2025-11-14 15:25:52,620 - INFO - Processing document 4_2025-08-14
2025-11-14 15:25:52,642 - INFO - Finished converting document 4_2025-08-14 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2025-05-13' --> 'data\processed_data\ABBV\4_2025-05-13.md'
Converted 'data\edgar_documents\ABBV\4_2025-07-02' --> 'data\processed_data\ABBV\4_2025-07-02.md'
Converted 'data\edgar_documents\ABBV\4_2025-08-07' --> 'data\processed_data\ABBV\4_2025-08-07.md'


2025-11-14 15:25:52,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,684 - INFO - Going to convert document batch...
2025-11-14 15:25:52,685 - INFO - Processing document 4_2025-10-02
2025-11-14 15:25:52,704 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:25:52,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,753 - INFO - Going to convert document batch...
2025-11-14 15:25:52,754 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:25:52,774 - INFO - Finished converting document 8-K_2023-01-06 in 0.05 sec.
2025-11-14 15:25:52,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,816 - INFO - Going to convert document batch...
2025-11-14 15:25:52,816 - INFO - Processing document 8-K_2023-01-10
2025-11-14 15:25:52,838 - INFO - Finished converting document 8-K_2023-01-10 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2025-08-14' --> 'data\processed_data\ABBV\4_2025-08-14.md'
Converted 'data\edgar_documents\ABBV\4_2025-10-02' --> 'data\processed_data\ABBV\4_2025-10-02.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-01-06' --> 'data\processed_data\ABBV\8-K_2023-01-06.md'


2025-11-14 15:25:52,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,887 - INFO - Going to convert document batch...
2025-11-14 15:25:52,889 - INFO - Processing document 8-K_2023-02-09
2025-11-14 15:25:52,912 - INFO - Finished converting document 8-K_2023-02-09 in 0.05 sec.
2025-11-14 15:25:52,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,950 - INFO - Going to convert document batch...
2025-11-14 15:25:52,951 - INFO - Processing document 8-K_2023-03-28
2025-11-14 15:25:52,976 - INFO - Finished converting document 8-K_2023-03-28 in 0.05 sec.
2025-11-14 15:25:53,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,044 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2023-01-10' --> 'data\processed_data\ABBV\8-K_2023-01-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-02-09' --> 'data\processed_data\ABBV\8-K_2023-02-09.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-03-28' --> 'data\processed_data\ABBV\8-K_2023-03-28.md'


2025-11-14 15:25:53,045 - INFO - Processing document 8-K_2023-04-05
2025-11-14 15:25:53,068 - INFO - Finished converting document 8-K_2023-04-05 in 0.08 sec.
2025-11-14 15:25:53,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,108 - INFO - Going to convert document batch...
2025-11-14 15:25:53,110 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:25:53,132 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:25:53,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,179 - INFO - Going to convert document batch...
2025-11-14 15:25:53,179 - INFO - Processing document 8-K_2023-05-10
2025-11-14 15:25:53,221 - INFO - Finished converting document 8-K_2023-05-10 in 0.08 sec.
2025-11-14 15:25:53,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,266 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2023-04-05' --> 'data\processed_data\ABBV\8-K_2023-04-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-04-27' --> 'data\processed_data\ABBV\8-K_2023-04-27.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-05-10' --> 'data\processed_data\ABBV\8-K_2023-05-10.md'


2025-11-14 15:25:53,267 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:25:53,288 - INFO - Finished converting document 8-K_2023-06-29 in 0.05 sec.
2025-11-14 15:25:53,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,333 - INFO - Going to convert document batch...
2025-11-14 15:25:53,334 - INFO - Processing document 8-K_2023-07-06
2025-11-14 15:25:53,355 - INFO - Finished converting document 8-K_2023-07-06 in 0.06 sec.
2025-11-14 15:25:53,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,396 - INFO - Going to convert document batch...
2025-11-14 15:25:53,398 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:25:53,416 - INFO - Finished converting document 8-K_2023-07-27 in 0.05 sec.
2025-11-14 15:25:53,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,456 - INFO - Going to convert document batch...
2025-11-14 15:25:53,457 - INFO - Processing document 8-K_2023-10-04
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2023-06-29' --> 'data\processed_data\ABBV\8-K_2023-06-29.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-07-06' --> 'data\processed_data\ABBV\8-K_2023-07-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-07-27' --> 'data\processed_data\ABBV\8-K_2023-07-27.md'


2025-11-14 15:25:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,521 - INFO - Going to convert document batch...
2025-11-14 15:25:53,521 - INFO - Processing document 8-K_2023-10-12
2025-11-14 15:25:53,550 - INFO - Finished converting document 8-K_2023-10-12 in 0.06 sec.
2025-11-14 15:25:53,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,596 - INFO - Going to convert document batch...
2025-11-14 15:25:53,597 - INFO - Processing document 8-K_2023-10-27
2025-11-14 15:25:53,619 - INFO - Finished converting document 8-K_2023-10-27 in 0.06 sec.
2025-11-14 15:25:53,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,662 - INFO - Going to convert document batch...
2025-11-14 15:25:53,663 - INFO - Processing document 8-K_2023-11-30
2025-11-14 15:25:53,688 - INFO - Finished converting document 8-K_2023-11-30 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\8-K_2023-10-04' --> 'data\processed_data\ABBV\8-K_2023-10-04.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-10-12' --> 'data\processed_data\ABBV\8-K_2023-10-12.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-10-27' --> 'data\processed_data\ABBV\8-K_2023-10-27.md'


2025-11-14 15:25:53,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,736 - INFO - Going to convert document batch...
2025-11-14 15:25:53,737 - INFO - Processing document 8-K_2023-12-06


Converted 'data\edgar_documents\ABBV\8-K_2023-11-30' --> 'data\processed_data\ABBV\8-K_2023-11-30.md'


2025-11-14 15:25:54,243 - INFO - Finished converting document 8-K_2023-12-06 in 0.53 sec.
2025-11-14 15:25:54,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,328 - INFO - Going to convert document batch...
2025-11-14 15:25:54,329 - INFO - Processing document 8-K_2024-01-05
2025-11-14 15:25:54,349 - INFO - Finished converting document 8-K_2024-01-05 in 0.08 sec.
2025-11-14 15:25:54,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,384 - INFO - Going to convert document batch...
2025-11-14 15:25:54,385 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:25:54,405 - INFO - Finished converting document 8-K_2024-02-02 in 0.05 sec.
2025-11-14 15:25:54,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,440 - INFO - Going to convert document batch...
2025-11-14 15:25:54,441 - INFO - Processing document 8-K_2024-02-12
2025-11-14 15:25:54,473 - INFO - Finished converting document 8-K_2024-02-12 in 0.

Converted 'data\edgar_documents\ABBV\8-K_2023-12-06' --> 'data\processed_data\ABBV\8-K_2023-12-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-01-05' --> 'data\processed_data\ABBV\8-K_2024-01-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-02-02' --> 'data\processed_data\ABBV\8-K_2024-02-02.md'


2025-11-14 15:25:54,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,520 - INFO - Going to convert document batch...
2025-11-14 15:25:54,521 - INFO - Processing document 8-K_2024-02-20
2025-11-14 15:25:54,550 - INFO - Finished converting document 8-K_2024-02-20 in 0.06 sec.
2025-11-14 15:25:54,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,627 - INFO - Going to convert document batch...
2025-11-14 15:25:54,628 - INFO - Processing document 8-K_2024-02-26
2025-11-14 15:25:54,667 - INFO - Finished converting document 8-K_2024-02-26 in 0.09 sec.


Converted 'data\edgar_documents\ABBV\8-K_2024-02-12' --> 'data\processed_data\ABBV\8-K_2024-02-12.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-02-20' --> 'data\processed_data\ABBV\8-K_2024-02-20.md'


2025-11-14 15:25:54,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,717 - INFO - Going to convert document batch...
2025-11-14 15:25:54,718 - INFO - Processing document 8-K_2024-04-03
2025-11-14 15:25:54,744 - INFO - Finished converting document 8-K_2024-04-03 in 0.05 sec.
2025-11-14 15:25:54,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,782 - INFO - Going to convert document batch...
2025-11-14 15:25:54,783 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:25:54,803 - INFO - Finished converting document 8-K_2024-04-26 in 0.05 sec.
2025-11-14 15:25:54,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,852 - INFO - Going to convert document batch...
2025-11-14 15:25:54,853 - INFO - Processing document 8-K_2024-05-08
2025-11-14 15:25:54,891 - INFO - Finished converting document 8-K_2024-05-08 in 0.08 sec.


Converted 'data\edgar_documents\ABBV\8-K_2024-02-26' --> 'data\processed_data\ABBV\8-K_2024-02-26.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-04-03' --> 'data\processed_data\ABBV\8-K_2024-04-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-04-26' --> 'data\processed_data\ABBV\8-K_2024-04-26.md'


2025-11-14 15:25:54,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,973 - INFO - Going to convert document batch...
2025-11-14 15:25:54,974 - INFO - Processing document 8-K_2024-07-03
2025-11-14 15:25:54,999 - INFO - Finished converting document 8-K_2024-07-03 in 0.09 sec.
2025-11-14 15:25:55,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,034 - INFO - Going to convert document batch...
2025-11-14 15:25:55,034 - INFO - Processing document 8-K_2024-07-25
2025-11-14 15:25:55,056 - INFO - Finished converting document 8-K_2024-07-25 in 0.05 sec.
2025-11-14 15:25:55,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,093 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2024-05-08' --> 'data\processed_data\ABBV\8-K_2024-05-08.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-07-03' --> 'data\processed_data\ABBV\8-K_2024-07-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-07-25' --> 'data\processed_data\ABBV\8-K_2024-07-25.md'


2025-11-14 15:25:55,094 - INFO - Processing document 8-K_2024-09-10
2025-11-14 15:25:55,119 - INFO - Finished converting document 8-K_2024-09-10 in 0.05 sec.
2025-11-14 15:25:55,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,162 - INFO - Going to convert document batch...
2025-11-14 15:25:55,163 - INFO - Processing document 8-K_2024-10-03
2025-11-14 15:25:55,182 - INFO - Finished converting document 8-K_2024-10-03 in 0.05 sec.
2025-11-14 15:25:55,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,218 - INFO - Going to convert document batch...
2025-11-14 15:25:55,219 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:25:55,239 - INFO - Finished converting document 8-K_2024-10-30 in 0.05 sec.
2025-11-14 15:25:55,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,274 - INFO - Going to convert document batch...
2025-11-14 15:25:55,275 - INFO - Processing document 8-K_2024-12-13
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2024-09-10' --> 'data\processed_data\ABBV\8-K_2024-09-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-10-03' --> 'data\processed_data\ABBV\8-K_2024-10-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-10-30' --> 'data\processed_data\ABBV\8-K_2024-10-30.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-12-13' --> 'data\processed_data\ABBV\8-K_2024-12-13.md'


2025-11-14 15:25:55,331 - INFO - Processing document 8-K_2025-01-06
2025-11-14 15:25:55,359 - INFO - Finished converting document 8-K_2025-01-06 in 0.06 sec.
2025-11-14 15:25:55,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,393 - INFO - Going to convert document batch...
2025-11-14 15:25:55,393 - INFO - Processing document 8-K_2025-01-10
2025-11-14 15:25:55,411 - INFO - Finished converting document 8-K_2025-01-10 in 0.05 sec.
2025-11-14 15:25:55,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,441 - INFO - Going to convert document batch...
2025-11-14 15:25:55,443 - INFO - Processing document 8-K_2025-01-31
2025-11-14 15:25:55,462 - INFO - Finished converting document 8-K_2025-01-31 in 0.03 sec.
2025-11-14 15:25:55,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,522 - INFO - Going to convert document batch...
2025-11-14 15:25:55,524 - INFO - Processing document 8-K_2025-02-05
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2025-01-06' --> 'data\processed_data\ABBV\8-K_2025-01-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-01-10' --> 'data\processed_data\ABBV\8-K_2025-01-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-01-31' --> 'data\processed_data\ABBV\8-K_2025-01-31.md'


2025-11-14 15:25:55,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,592 - INFO - Going to convert document batch...
2025-11-14 15:25:55,593 - INFO - Processing document 8-K_2025-02-14
2025-11-14 15:25:55,623 - INFO - Finished converting document 8-K_2025-02-14 in 0.06 sec.
2025-11-14 15:25:55,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,668 - INFO - Going to convert document batch...
2025-11-14 15:25:55,669 - INFO - Processing document 8-K_2025-02-19
2025-11-14 15:25:55,699 - INFO - Finished converting document 8-K_2025-02-19 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\8-K_2025-02-05' --> 'data\processed_data\ABBV\8-K_2025-02-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-02-14' --> 'data\processed_data\ABBV\8-K_2025-02-14.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-02-19' --> 'data\processed_data\ABBV\8-K_2025-02-19.md'


2025-11-14 15:25:55,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,783 - INFO - Going to convert document batch...
2025-11-14 15:25:55,784 - INFO - Processing document 8-K_2025-02-26
2025-11-14 15:25:55,819 - INFO - Finished converting document 8-K_2025-02-26 in 0.09 sec.
2025-11-14 15:25:55,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,867 - INFO - Going to convert document batch...
2025-11-14 15:25:55,867 - INFO - Processing document 8-K_2025-04-03
2025-11-14 15:25:55,887 - INFO - Finished converting document 8-K_2025-04-03 in 0.05 sec.
2025-11-14 15:25:55,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,921 - INFO - Going to convert document batch...
2025-11-14 15:25:55,922 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:25:55,942 - INFO - Finished converting document 8-K_2025-04-25 in 0.05 sec.
2025-11-14 15:25:55,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABBV\8-K_2025-02-26' --> 'data\processed_data\ABBV\8-K_2025-02-26.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-04-03' --> 'data\processed_data\ABBV\8-K_2025-04-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-04-25' --> 'data\processed_data\ABBV\8-K_2025-04-25.md'


2025-11-14 15:25:56,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,059 - INFO - Going to convert document batch...
2025-11-14 15:25:56,059 - INFO - Processing document 8-K_2025-07-03
2025-11-14 15:25:56,081 - INFO - Finished converting document 8-K_2025-07-03 in 0.05 sec.
2025-11-14 15:25:56,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,143 - INFO - Going to convert document batch...
2025-11-14 15:25:56,144 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:25:56,166 - INFO - Finished converting document 8-K_2025-07-31 in 0.06 sec.
2025-11-14 15:25:56,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,197 - INFO - Going to convert document batch...
2025-11-14 15:25:56,198 - INFO - Processing document 8-K_2025-09-11


Converted 'data\edgar_documents\ABBV\8-K_2025-05-13' --> 'data\processed_data\ABBV\8-K_2025-05-13.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-07-03' --> 'data\processed_data\ABBV\8-K_2025-07-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-07-31' --> 'data\processed_data\ABBV\8-K_2025-07-31.md'


2025-11-14 15:25:56,217 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:25:56,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,263 - INFO - Going to convert document batch...
2025-11-14 15:25:56,264 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:25:56,284 - INFO - Finished converting document 8-K_2025-10-03 in 0.05 sec.
2025-11-14 15:25:56,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,321 - INFO - Going to convert document batch...
2025-11-14 15:25:56,321 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:25:56,339 - INFO - Finished converting document 8-K_2025-10-31 in 0.05 sec.
2025-11-14 15:25:56,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\8-K_2025-09-11' --> 'data\processed_data\ABBV\8-K_2025-09-11.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-10-03' --> 'data\processed_data\ABBV\8-K_2025-10-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-10-31' --> 'data\processed_data\ABBV\8-K_2025-10-31.md'


2025-11-14 15:25:57,301 - INFO - Going to convert document batch...
2025-11-14 15:25:57,302 - INFO - Processing document DEF-14A_2023-03-20
2025-11-14 15:26:01,382 - INFO - Finished converting document DEF-14A_2023-03-20 in 5.03 sec.
2025-11-14 15:26:02,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2023-03-20' --> 'data\processed_data\ABBV\DEF-14A_2023-03-20.md'


2025-11-14 15:26:02,778 - INFO - Going to convert document batch...
2025-11-14 15:26:02,779 - INFO - Processing document DEF-14A_2024-03-18
2025-11-14 15:26:06,912 - INFO - Finished converting document DEF-14A_2024-03-18 in 4.83 sec.
2025-11-14 15:26:07,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2024-03-18' --> 'data\processed_data\ABBV\DEF-14A_2024-03-18.md'


2025-11-14 15:26:08,382 - INFO - Going to convert document batch...
2025-11-14 15:26:08,383 - INFO - Processing document DEF-14A_2025-03-24
2025-11-14 15:26:12,953 - INFO - Finished converting document DEF-14A_2025-03-24 in 5.34 sec.
2025-11-14 15:26:13,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2025-03-24' --> 'data\processed_data\ABBV\DEF-14A_2025-03-24.md'
Processed 109 new files. Errors: 3
Found 82 files to process in data\edgar_documents\ABT


2025-11-14 15:26:14,283 - INFO - Going to convert document batch...
2025-11-14 15:26:14,284 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:26:14,285 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:26:15,370 - INFO - Finished converting document 10-K_2023-02-17 in 1.69 sec.
2025-11-14 15:26:15,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2023-02-17' --> 'data\processed_data\ABT\10-K_2023-02-17.md'


2025-11-14 15:26:16,907 - INFO - Going to convert document batch...
2025-11-14 15:26:16,908 - INFO - Processing document 10-K_2024-02-16
2025-11-14 15:26:17,975 - INFO - Finished converting document 10-K_2024-02-16 in 2.11 sec.
2025-11-14 15:26:18,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2024-02-16' --> 'data\processed_data\ABT\10-K_2024-02-16.md'


2025-11-14 15:26:19,426 - INFO - Going to convert document batch...
2025-11-14 15:26:19,428 - INFO - Processing document 10-K_2025-02-21
2025-11-14 15:26:20,555 - INFO - Finished converting document 10-K_2025-02-21 in 2.09 sec.
2025-11-14 15:26:21,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2025-02-21' --> 'data\processed_data\ABT\10-K_2025-02-21.md'


2025-11-14 15:26:21,308 - INFO - Going to convert document batch...
2025-11-14 15:26:21,309 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 15:26:21,727 - INFO - Finished converting document 10-Q_2023-05-04 in 0.67 sec.
2025-11-14 15:26:21,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-05-04' --> 'data\processed_data\ABT\10-Q_2023-05-04.md'


2025-11-14 15:26:22,690 - INFO - Going to convert document batch...
2025-11-14 15:26:22,690 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 15:26:23,302 - INFO - Finished converting document 10-Q_2023-08-03 in 1.34 sec.
2025-11-14 15:26:23,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-08-03' --> 'data\processed_data\ABT\10-Q_2023-08-03.md'


2025-11-14 15:26:23,950 - INFO - Going to convert document batch...
2025-11-14 15:26:23,951 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:26:24,550 - INFO - Finished converting document 10-Q_2023-11-01 in 0.95 sec.
2025-11-14 15:26:25,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-11-01' --> 'data\processed_data\ABT\10-Q_2023-11-01.md'


2025-11-14 15:26:25,399 - INFO - Going to convert document batch...
2025-11-14 15:26:25,400 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:26:25,829 - INFO - Finished converting document 10-Q_2024-05-02 in 0.67 sec.
2025-11-14 15:26:26,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-05-02' --> 'data\processed_data\ABT\10-Q_2024-05-02.md'


2025-11-14 15:26:26,406 - INFO - Going to convert document batch...
2025-11-14 15:26:26,407 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:26:27,024 - INFO - Finished converting document 10-Q_2024-07-31 in 0.95 sec.
2025-11-14 15:26:27,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-07-31' --> 'data\processed_data\ABT\10-Q_2024-07-31.md'


2025-11-14 15:26:27,953 - INFO - Going to convert document batch...
2025-11-14 15:26:27,954 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:26:28,543 - INFO - Finished converting document 10-Q_2024-10-31 in 1.23 sec.
2025-11-14 15:26:28,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-10-31' --> 'data\processed_data\ABT\10-Q_2024-10-31.md'


2025-11-14 15:26:29,104 - INFO - Going to convert document batch...
2025-11-14 15:26:29,105 - INFO - Processing document 10-Q_2025-04-30
2025-11-14 15:26:29,568 - INFO - Finished converting document 10-Q_2025-04-30 in 0.73 sec.
2025-11-14 15:26:29,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2025-04-30' --> 'data\processed_data\ABT\10-Q_2025-04-30.md'


2025-11-14 15:26:30,449 - INFO - Going to convert document batch...
2025-11-14 15:26:30,450 - INFO - Processing document 10-Q_2025-07-30
2025-11-14 15:26:31,120 - INFO - Finished converting document 10-Q_2025-07-30 in 1.33 sec.
2025-11-14 15:26:31,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2025-07-30' --> 'data\processed_data\ABT\10-Q_2025-07-30.md'


2025-11-14 15:26:32,093 - INFO - Going to convert document batch...
2025-11-14 15:26:32,094 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 15:26:32,732 - INFO - Finished converting document 10-Q_2025-10-29 in 1.30 sec.
2025-11-14 15:26:33,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,086 - INFO - Going to convert document batch...
2025-11-14 15:26:33,087 - INFO - Processing document 4_2023-01-03
2025-11-14 15:26:33,108 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 15:26:33,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,152 - INFO - Going to convert document batch...
2025-11-14 15:26:33,152 - INFO - Processing document 4_2023-01-04
2025-11-14 15:26:33,172 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:26:33,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,230 - INFO - Going to convert document batch...
2025-11-14 15:26:33,

Converted 'data\edgar_documents\ABT\10-Q_2025-10-29' --> 'data\processed_data\ABT\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\ABT\4_2023-01-03' --> 'data\processed_data\ABT\4_2023-01-03.md'
Converted 'data\edgar_documents\ABT\4_2023-01-04' --> 'data\processed_data\ABT\4_2023-01-04.md'


2025-11-14 15:26:33,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,298 - INFO - Going to convert document batch...
2025-11-14 15:26:33,299 - INFO - Processing document 4_2023-03-02
2025-11-14 15:26:33,321 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 15:26:33,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,385 - INFO - Going to convert document batch...
2025-11-14 15:26:33,386 - INFO - Processing document 4_2023-04-04
2025-11-14 15:26:33,407 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 15:26:33,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\4_2023-02-22' --> 'data\processed_data\ABT\4_2023-02-22.md'
Converted 'data\edgar_documents\ABT\4_2023-03-02' --> 'data\processed_data\ABT\4_2023-03-02.md'
Converted 'data\edgar_documents\ABT\4_2023-04-04' --> 'data\processed_data\ABT\4_2023-04-04.md'


2025-11-14 15:26:33,473 - INFO - Going to convert document batch...
2025-11-14 15:26:33,474 - INFO - Processing document 4_2023-05-02
2025-11-14 15:26:33,492 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 15:26:33,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,540 - INFO - Going to convert document batch...
2025-11-14 15:26:33,541 - INFO - Processing document 4_2023-05-03
2025-11-14 15:26:33,561 - INFO - Finished converting document 4_2023-05-03 in 0.05 sec.
2025-11-14 15:26:33,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,610 - INFO - Going to convert document batch...
2025-11-14 15:26:33,610 - INFO - Processing document 4_2023-06-20
2025-11-14 15:26:33,633 - INFO - Finished converting document 4_2023-06-20 in 0.03 sec.
2025-11-14 15:26:33,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,678 - INFO - Going to convert document batch...
2025-11-14 15:26:33,679 - 

Converted 'data\edgar_documents\ABT\4_2023-05-02' --> 'data\processed_data\ABT\4_2023-05-02.md'
Converted 'data\edgar_documents\ABT\4_2023-05-03' --> 'data\processed_data\ABT\4_2023-05-03.md'
Converted 'data\edgar_documents\ABT\4_2023-06-20' --> 'data\processed_data\ABT\4_2023-06-20.md'


2025-11-14 15:26:33,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,756 - INFO - Going to convert document batch...
2025-11-14 15:26:33,757 - INFO - Processing document 4_2023-07-28
2025-11-14 15:26:33,805 - INFO - Finished converting document 4_2023-07-28 in 0.08 sec.
2025-11-14 15:26:33,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,890 - INFO - Going to convert document batch...
2025-11-14 15:26:33,891 - INFO - Processing document 4_2023-08-10
2025-11-14 15:26:33,916 - INFO - Finished converting document 4_2023-08-10 in 0.06 sec.


Converted 'data\edgar_documents\ABT\4_2023-07-05' --> 'data\processed_data\ABT\4_2023-07-05.md'
Converted 'data\edgar_documents\ABT\4_2023-07-28' --> 'data\processed_data\ABT\4_2023-07-28.md'


2025-11-14 15:26:33,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,963 - INFO - Going to convert document batch...
2025-11-14 15:26:33,964 - INFO - Processing document 4_2023-09-06
2025-11-14 15:26:33,985 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 15:26:34,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,030 - INFO - Going to convert document batch...
2025-11-14 15:26:34,031 - INFO - Processing document 4_2023-09-15
2025-11-14 15:26:34,052 - INFO - Finished converting document 4_2023-09-15 in 0.05 sec.
2025-11-14 15:26:34,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,114 - INFO - Going to convert document batch...
2025-11-14 15:26:34,115 - INFO - Processing document 4_2023-10-03
2025-11-14 15:26:34,134 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2023-08-10' --> 'data\processed_data\ABT\4_2023-08-10.md'
Converted 'data\edgar_documents\ABT\4_2023-09-06' --> 'data\processed_data\ABT\4_2023-09-06.md'
Converted 'data\edgar_documents\ABT\4_2023-09-15' --> 'data\processed_data\ABT\4_2023-09-15.md'


2025-11-14 15:26:34,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,180 - INFO - Going to convert document batch...
2025-11-14 15:26:34,181 - INFO - Processing document 4_2023-10-30
2025-11-14 15:26:34,256 - INFO - Finished converting document 4_2023-10-30 in 0.09 sec.
2025-11-14 15:26:34,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,337 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\4_2023-10-03' --> 'data\processed_data\ABT\4_2023-10-03.md'
Converted 'data\edgar_documents\ABT\4_2023-10-30' --> 'data\processed_data\ABT\4_2023-10-30.md'


2025-11-14 15:26:34,338 - INFO - Processing document 4_2023-12-18
2025-11-14 15:26:34,374 - INFO - Finished converting document 4_2023-12-18 in 0.09 sec.
2025-11-14 15:26:34,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,415 - INFO - Going to convert document batch...
2025-11-14 15:26:34,416 - INFO - Processing document 4_2024-01-03
2025-11-14 15:26:34,435 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:26:34,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,479 - INFO - Going to convert document batch...
2025-11-14 15:26:34,481 - INFO - Processing document 4_2024-01-31
2025-11-14 15:26:34,503 - INFO - Finished converting document 4_2024-01-31 in 0.05 sec.
2025-11-14 15:26:34,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,546 - INFO - Going to convert document batch...
2025-11-14 15:26:34,547 - INFO - Processing document 4_2024-02-23
2025-11-14 15:26:34,566 - IN

Converted 'data\edgar_documents\ABT\4_2023-12-18' --> 'data\processed_data\ABT\4_2023-12-18.md'
Converted 'data\edgar_documents\ABT\4_2024-01-03' --> 'data\processed_data\ABT\4_2024-01-03.md'
Converted 'data\edgar_documents\ABT\4_2024-01-31' --> 'data\processed_data\ABT\4_2024-01-31.md'


2025-11-14 15:26:34,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,608 - INFO - Going to convert document batch...
2025-11-14 15:26:34,609 - INFO - Processing document 4_2024-02-27
2025-11-14 15:26:34,631 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:26:34,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,671 - INFO - Going to convert document batch...
2025-11-14 15:26:34,671 - INFO - Processing document 4_2024-03-04
2025-11-14 15:26:34,687 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.
2025-11-14 15:26:34,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,728 - INFO - Going to convert document batch...
2025-11-14 15:26:34,729 - INFO - Processing document 4_2024-04-02
2025-11-14 15:26:34,752 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2024-02-23' --> 'data\processed_data\ABT\4_2024-02-23.md'
Converted 'data\edgar_documents\ABT\4_2024-02-27' --> 'data\processed_data\ABT\4_2024-02-27.md'
Converted 'data\edgar_documents\ABT\4_2024-03-04' --> 'data\processed_data\ABT\4_2024-03-04.md'
Converted 'data\edgar_documents\ABT\4_2024-04-02' --> 'data\processed_data\ABT\4_2024-04-02.md'


2025-11-14 15:26:34,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,809 - INFO - Going to convert document batch...
2025-11-14 15:26:34,810 - INFO - Processing document 4_2024-04-30
2025-11-14 15:26:34,828 - INFO - Finished converting document 4_2024-04-30 in 0.06 sec.
2025-11-14 15:26:34,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,870 - INFO - Going to convert document batch...
2025-11-14 15:26:34,871 - INFO - Processing document 4_2024-05-08
2025-11-14 15:26:34,889 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.
2025-11-14 15:26:34,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,930 - INFO - Going to convert document batch...
2025-11-14 15:26:34,932 - INFO - Processing document 4_2024-05-14
2025-11-14 15:26:34,956 - INFO - Finished converting document 4_2024-05-14 in 0.05 sec.
2025-11-14 15:26:34,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABT\4_2024-04-30' --> 'data\processed_data\ABT\4_2024-04-30.md'
Converted 'data\edgar_documents\ABT\4_2024-05-08' --> 'data\processed_data\ABT\4_2024-05-08.md'
Converted 'data\edgar_documents\ABT\4_2024-05-14' --> 'data\processed_data\ABT\4_2024-05-14.md'
Converted 'data\edgar_documents\ABT\4_2024-07-02' --> 'data\processed_data\ABT\4_2024-07-02.md'


2025-11-14 15:26:35,064 - INFO - Going to convert document batch...
2025-11-14 15:26:35,065 - INFO - Processing document 4_2024-09-04
2025-11-14 15:26:35,087 - INFO - Finished converting document 4_2024-09-04 in 0.03 sec.
2025-11-14 15:26:35,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,133 - INFO - Going to convert document batch...
2025-11-14 15:26:35,134 - INFO - Processing document 4_2024-09-13
2025-11-14 15:26:35,160 - INFO - Finished converting document 4_2024-09-13 in 0.05 sec.
2025-11-14 15:26:35,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,231 - INFO - Going to convert document batch...
2025-11-14 15:26:35,232 - INFO - Processing document 4_2024-10-01
2025-11-14 15:26:35,256 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 15:26:35,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,298 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\4_2024-09-04' --> 'data\processed_data\ABT\4_2024-09-04.md'
Converted 'data\edgar_documents\ABT\4_2024-09-13' --> 'data\processed_data\ABT\4_2024-09-13.md'
Converted 'data\edgar_documents\ABT\4_2024-10-01' --> 'data\processed_data\ABT\4_2024-10-01.md'


2025-11-14 15:26:35,299 - INFO - Processing document 4_2024-10-23
2025-11-14 15:26:35,323 - INFO - Finished converting document 4_2024-10-23 in 0.06 sec.
2025-11-14 15:26:35,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,389 - INFO - Going to convert document batch...
2025-11-14 15:26:35,390 - INFO - Processing document 4_2025-01-03
2025-11-14 15:26:35,408 - INFO - Finished converting document 4_2025-01-03 in 0.06 sec.
2025-11-14 15:26:35,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,449 - INFO - Going to convert document batch...
2025-11-14 15:26:35,450 - INFO - Processing document 4_2025-01-30
2025-11-14 15:26:35,468 - INFO - Finished converting document 4_2025-01-30 in 0.05 sec.
2025-11-14 15:26:35,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,512 - INFO - Going to convert document batch...
2025-11-14 15:26:35,514 - INFO - Processing document 4_2025-01-31
2025-11-14 15:26:35,540 - IN

Converted 'data\edgar_documents\ABT\4_2024-10-23' --> 'data\processed_data\ABT\4_2024-10-23.md'
Converted 'data\edgar_documents\ABT\4_2025-01-03' --> 'data\processed_data\ABT\4_2025-01-03.md'
Converted 'data\edgar_documents\ABT\4_2025-01-30' --> 'data\processed_data\ABT\4_2025-01-30.md'


2025-11-14 15:26:35,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,611 - INFO - Going to convert document batch...
2025-11-14 15:26:35,613 - INFO - Processing document 4_2025-02-07
2025-11-14 15:26:35,640 - INFO - Finished converting document 4_2025-02-07 in 0.08 sec.
2025-11-14 15:26:35,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,689 - INFO - Going to convert document batch...
2025-11-14 15:26:35,690 - INFO - Processing document 4_2025-02-27
2025-11-14 15:26:35,709 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.
2025-11-14 15:26:35,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\4_2025-01-31' --> 'data\processed_data\ABT\4_2025-01-31.md'
Converted 'data\edgar_documents\ABT\4_2025-02-07' --> 'data\processed_data\ABT\4_2025-02-07.md'
Converted 'data\edgar_documents\ABT\4_2025-02-27' --> 'data\processed_data\ABT\4_2025-02-27.md'


2025-11-14 15:26:35,753 - INFO - Going to convert document batch...
2025-11-14 15:26:35,754 - INFO - Processing document 4_2025-03-04
2025-11-14 15:26:35,772 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 15:26:35,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,816 - INFO - Going to convert document batch...
2025-11-14 15:26:35,817 - INFO - Processing document 4_2025-03-07
2025-11-14 15:26:35,840 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 15:26:35,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,885 - INFO - Going to convert document batch...
2025-11-14 15:26:35,885 - INFO - Processing document 4_2025-04-02
2025-11-14 15:26:35,904 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 15:26:35,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,944 - INFO - Going to convert document batch...
2025-11-14 15:26:35,945 - 

Converted 'data\edgar_documents\ABT\4_2025-03-04' --> 'data\processed_data\ABT\4_2025-03-04.md'
Converted 'data\edgar_documents\ABT\4_2025-03-07' --> 'data\processed_data\ABT\4_2025-03-07.md'
Converted 'data\edgar_documents\ABT\4_2025-04-02' --> 'data\processed_data\ABT\4_2025-04-02.md'


2025-11-14 15:26:35,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,007 - INFO - Going to convert document batch...
2025-11-14 15:26:36,008 - INFO - Processing document 4_2025-05-02
2025-11-14 15:26:36,027 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 15:26:36,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,089 - INFO - Going to convert document batch...
2025-11-14 15:26:36,090 - INFO - Processing document 4_2025-07-01
2025-11-14 15:26:36,108 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.
2025-11-14 15:26:36,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,150 - INFO - Going to convert document batch...
2025-11-14 15:26:36,151 - INFO - Processing document 4_2025-08-11
2025-11-14 15:26:36,168 - INFO - Finished converting document 4_2025-08-11 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2025-04-29' --> 'data\processed_data\ABT\4_2025-04-29.md'
Converted 'data\edgar_documents\ABT\4_2025-05-02' --> 'data\processed_data\ABT\4_2025-05-02.md'
Converted 'data\edgar_documents\ABT\4_2025-07-01' --> 'data\processed_data\ABT\4_2025-07-01.md'


2025-11-14 15:26:36,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,212 - INFO - Going to convert document batch...
2025-11-14 15:26:36,213 - INFO - Processing document 4_2025-09-03
2025-11-14 15:26:36,234 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 15:26:36,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,302 - INFO - Going to convert document batch...
2025-11-14 15:26:36,303 - INFO - Processing document 4_2025-10-02
2025-11-14 15:26:36,323 - INFO - Finished converting document 4_2025-10-02 in 0.08 sec.


Converted 'data\edgar_documents\ABT\4_2025-08-11' --> 'data\processed_data\ABT\4_2025-08-11.md'
Converted 'data\edgar_documents\ABT\4_2025-09-03' --> 'data\processed_data\ABT\4_2025-09-03.md'
Converted 'data\edgar_documents\ABT\4_2025-10-02' --> 'data\processed_data\ABT\4_2025-10-02.md'


2025-11-14 15:26:36,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,432 - INFO - Going to convert document batch...
2025-11-14 15:26:36,434 - INFO - Processing document 8-K_2023-01-25
2025-11-14 15:26:36,466 - INFO - Finished converting document 8-K_2023-01-25 in 0.11 sec.
2025-11-14 15:26:36,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,510 - INFO - Going to convert document batch...
2025-11-14 15:26:36,511 - INFO - Processing document 8-K_2023-02-17
2025-11-14 15:26:36,529 - INFO - Finished converting document 8-K_2023-02-17 in 0.05 sec.
2025-11-14 15:26:36,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,566 - INFO - Going to convert document batch...
2025-11-14 15:26:36,567 - INFO - Processing document 8-K_2023-04-19
2025-11-14 15:26:36,582 - INFO - Finished converting document 8-K_2023-04-19 in 0.03 sec.
2025-11-14 15:26:36,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABT\8-K_2023-01-25' --> 'data\processed_data\ABT\8-K_2023-01-25.md'
Converted 'data\edgar_documents\ABT\8-K_2023-02-17' --> 'data\processed_data\ABT\8-K_2023-02-17.md'
Converted 'data\edgar_documents\ABT\8-K_2023-04-19' --> 'data\processed_data\ABT\8-K_2023-04-19.md'


2025-11-14 15:26:36,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,784 - INFO - Going to convert document batch...
2025-11-14 15:26:36,786 - INFO - Processing document 8-K_2023-06-09
2025-11-14 15:26:36,811 - INFO - Finished converting document 8-K_2023-06-09 in 0.12 sec.
2025-11-14 15:26:36,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,872 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\8-K_2023-05-02' --> 'data\processed_data\ABT\8-K_2023-05-02.md'
Converted 'data\edgar_documents\ABT\8-K_2023-06-09' --> 'data\processed_data\ABT\8-K_2023-06-09.md'


2025-11-14 15:26:36,873 - INFO - Processing document 8-K_2023-06-12
2025-11-14 15:26:36,895 - INFO - Finished converting document 8-K_2023-06-12 in 0.06 sec.
2025-11-14 15:26:36,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,939 - INFO - Going to convert document batch...
2025-11-14 15:26:36,940 - INFO - Processing document 8-K_2023-07-20
2025-11-14 15:26:36,956 - INFO - Finished converting document 8-K_2023-07-20 in 0.05 sec.
2025-11-14 15:26:36,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,988 - INFO - Going to convert document batch...
2025-11-14 15:26:36,989 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:26:37,005 - INFO - Finished converting document 8-K_2023-09-01 in 0.03 sec.
2025-11-14 15:26:37,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,042 - INFO - Going to convert document batch...
2025-11-14 15:26:37,043 - INFO - Processing document 8-K_2023-10-18
2025-11-14 15:

Converted 'data\edgar_documents\ABT\8-K_2023-06-12' --> 'data\processed_data\ABT\8-K_2023-06-12.md'
Converted 'data\edgar_documents\ABT\8-K_2023-07-20' --> 'data\processed_data\ABT\8-K_2023-07-20.md'
Converted 'data\edgar_documents\ABT\8-K_2023-09-01' --> 'data\processed_data\ABT\8-K_2023-09-01.md'
Converted 'data\edgar_documents\ABT\8-K_2023-10-18' --> 'data\processed_data\ABT\8-K_2023-10-18.md'


2025-11-14 15:26:37,094 - INFO - Processing document 8-K_2024-01-24
2025-11-14 15:26:37,109 - INFO - Finished converting document 8-K_2024-01-24 in 0.05 sec.
2025-11-14 15:26:37,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,149 - INFO - Going to convert document batch...
2025-11-14 15:26:37,150 - INFO - Processing document 8-K_2024-01-29


Converted 'data\edgar_documents\ABT\8-K_2024-01-24' --> 'data\processed_data\ABT\8-K_2024-01-24.md'


2025-11-14 15:26:37,550 - INFO - Finished converting document 8-K_2024-01-29 in 0.42 sec.
2025-11-14 15:26:37,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,590 - INFO - Going to convert document batch...
2025-11-14 15:26:37,590 - INFO - Processing document 8-K_2024-04-17
2025-11-14 15:26:37,604 - INFO - Finished converting document 8-K_2024-04-17 in 0.05 sec.
2025-11-14 15:26:37,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,649 - INFO - Going to convert document batch...
2025-11-14 15:26:37,649 - INFO - Processing document 8-K_2024-04-29
2025-11-14 15:26:37,676 - INFO - Finished converting document 8-K_2024-04-29 in 0.06 sec.
2025-11-14 15:26:37,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,717 - INFO - Going to convert document batch...
2025-11-14 15:26:37,717 - INFO - Processing document 8-K_2024-05-01
2025-11-14 15:26:37,736 - INFO - Finished converting document 8-K_2024-05-01 in 0.

Converted 'data\edgar_documents\ABT\8-K_2024-01-29' --> 'data\processed_data\ABT\8-K_2024-01-29.md'
Converted 'data\edgar_documents\ABT\8-K_2024-04-17' --> 'data\processed_data\ABT\8-K_2024-04-17.md'
Converted 'data\edgar_documents\ABT\8-K_2024-04-29' --> 'data\processed_data\ABT\8-K_2024-04-29.md'


2025-11-14 15:26:37,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,771 - INFO - Going to convert document batch...
2025-11-14 15:26:37,772 - INFO - Processing document 8-K_2024-07-18
2025-11-14 15:26:37,788 - INFO - Finished converting document 8-K_2024-07-18 in 0.03 sec.
2025-11-14 15:26:37,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,819 - INFO - Going to convert document batch...
2025-11-14 15:26:37,821 - INFO - Processing document 8-K_2024-10-16
2025-11-14 15:26:37,837 - INFO - Finished converting document 8-K_2024-10-16 in 0.03 sec.
2025-11-14 15:26:37,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,869 - INFO - Going to convert document batch...
2025-11-14 15:26:37,870 - INFO - Processing document 8-K_2024-11-15
2025-11-14 15:26:37,887 - INFO - Finished converting document 8-K_2024-11-15 in 0.05 sec.
2025-11-14 15:26:37,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABT\8-K_2024-05-01' --> 'data\processed_data\ABT\8-K_2024-05-01.md'
Converted 'data\edgar_documents\ABT\8-K_2024-07-18' --> 'data\processed_data\ABT\8-K_2024-07-18.md'
Converted 'data\edgar_documents\ABT\8-K_2024-10-16' --> 'data\processed_data\ABT\8-K_2024-10-16.md'
Converted 'data\edgar_documents\ABT\8-K_2024-11-15' --> 'data\processed_data\ABT\8-K_2024-11-15.md'


2025-11-14 15:26:37,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,969 - INFO - Going to convert document batch...
2025-11-14 15:26:37,970 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:26:37,987 - INFO - Finished converting document 8-K_2025-04-16 in 0.03 sec.
2025-11-14 15:26:38,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,030 - INFO - Going to convert document batch...
2025-11-14 15:26:38,031 - INFO - Processing document 8-K_2025-04-28
2025-11-14 15:26:38,062 - INFO - Finished converting document 8-K_2025-04-28 in 0.06 sec.
2025-11-14 15:26:38,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,103 - INFO - Going to convert document batch...
2025-11-14 15:26:38,104 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:26:38,120 - INFO - Finished converting document 8-K_2025-05-01 in 0.05 sec.
2025-11-14 15:26:38,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\8-K_2025-01-22' --> 'data\processed_data\ABT\8-K_2025-01-22.md'
Converted 'data\edgar_documents\ABT\8-K_2025-04-16' --> 'data\processed_data\ABT\8-K_2025-04-16.md'
Converted 'data\edgar_documents\ABT\8-K_2025-04-28' --> 'data\processed_data\ABT\8-K_2025-04-28.md'
Converted 'data\edgar_documents\ABT\8-K_2025-05-01' --> 'data\processed_data\ABT\8-K_2025-05-01.md'


2025-11-14 15:26:38,153 - INFO - Going to convert document batch...
2025-11-14 15:26:38,154 - INFO - Processing document 8-K_2025-07-17
2025-11-14 15:26:38,170 - INFO - Finished converting document 8-K_2025-07-17 in 0.05 sec.
2025-11-14 15:26:38,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,203 - INFO - Going to convert document batch...
2025-11-14 15:26:38,204 - INFO - Processing document 8-K_2025-10-15
2025-11-14 15:26:38,220 - INFO - Finished converting document 8-K_2025-10-15 in 0.05 sec.
2025-11-14 15:26:38,266 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:26:38,267 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\ABT\8-K_2025-07-17' --> 'data\processed_data\ABT\8-K_2025-07-17.md'
Converted 'data\edgar_documents\ABT\8-K_2025-10-15' --> 'data\processed_data\ABT\8-K_2025-10-15.md'
Error processing data\edgar_documents\ABT\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\ABT\DEF-14A_2023-03-17


2025-11-14 15:26:38,708 - INFO - Going to convert document batch...
2025-11-14 15:26:38,709 - INFO - Processing document DEF-14A_2024-03-15
2025-11-14 15:26:44,422 - INFO - Finished converting document DEF-14A_2024-03-15 in 6.16 sec.


Converted 'data\edgar_documents\ABT\DEF-14A_2024-03-15' --> 'data\processed_data\ABT\DEF-14A_2024-03-15.md'


2025-11-14 15:26:45,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:46,202 - INFO - Going to convert document batch...
2025-11-14 15:26:46,203 - INFO - Processing document DEF-14A_2025-03-14
2025-11-14 15:26:57,389 - INFO - Finished converting document DEF-14A_2025-03-14 in 12.28 sec.
2025-11-14 15:26:58,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\DEF-14A_2025-03-14' --> 'data\processed_data\ABT\DEF-14A_2025-03-14.md'
Processed 81 new files. Errors: 1
Found 153 files to process in data\edgar_documents\ACN


2025-11-14 15:26:59,272 - INFO - Going to convert document batch...
2025-11-14 15:26:59,273 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:26:59,274 - INFO - Processing document 10-K_2023-10-12
2025-11-14 15:27:01,081 - INFO - Finished converting document 10-K_2023-10-12 in 2.80 sec.
2025-11-14 15:27:01,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2023-10-12' --> 'data\processed_data\ACN\10-K_2023-10-12.md'


2025-11-14 15:27:02,663 - INFO - Going to convert document batch...
2025-11-14 15:27:02,664 - INFO - Processing document 10-K_2024-10-10
2025-11-14 15:27:04,496 - INFO - Finished converting document 10-K_2024-10-10 in 2.78 sec.
2025-11-14 15:27:05,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2024-10-10' --> 'data\processed_data\ACN\10-K_2024-10-10.md'


2025-11-14 15:27:06,273 - INFO - Going to convert document batch...
2025-11-14 15:27:06,274 - INFO - Processing document 10-K_2025-10-10
2025-11-14 15:27:08,122 - INFO - Finished converting document 10-K_2025-10-10 in 2.95 sec.
2025-11-14 15:27:08,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2025-10-10' --> 'data\processed_data\ACN\10-K_2025-10-10.md'


2025-11-14 15:27:09,221 - INFO - Going to convert document batch...
2025-11-14 15:27:09,221 - INFO - Processing document 10-Q_2023-03-23
2025-11-14 15:27:10,027 - INFO - Finished converting document 10-Q_2023-03-23 in 1.20 sec.
2025-11-14 15:27:10,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-03-23' --> 'data\processed_data\ACN\10-Q_2023-03-23.md'


2025-11-14 15:27:11,371 - INFO - Going to convert document batch...
2025-11-14 15:27:11,372 - INFO - Processing document 10-Q_2023-06-22
2025-11-14 15:27:12,192 - INFO - Finished converting document 10-Q_2023-06-22 in 1.69 sec.
2025-11-14 15:27:12,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-06-22' --> 'data\processed_data\ACN\10-Q_2023-06-22.md'


2025-11-14 15:27:12,921 - INFO - Going to convert document batch...
2025-11-14 15:27:12,922 - INFO - Processing document 10-Q_2023-12-19
2025-11-14 15:27:13,498 - INFO - Finished converting document 10-Q_2023-12-19 in 0.89 sec.
2025-11-14 15:27:13,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-12-19' --> 'data\processed_data\ACN\10-Q_2023-12-19.md'


2025-11-14 15:27:14,541 - INFO - Going to convert document batch...
2025-11-14 15:27:14,542 - INFO - Processing document 10-Q_2024-03-21
2025-11-14 15:27:15,318 - INFO - Finished converting document 10-Q_2024-03-21 in 1.50 sec.
2025-11-14 15:27:15,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-03-21' --> 'data\processed_data\ACN\10-Q_2024-03-21.md'


2025-11-14 15:27:16,104 - INFO - Going to convert document batch...
2025-11-14 15:27:16,105 - INFO - Processing document 10-Q_2024-06-20
2025-11-14 15:27:17,180 - INFO - Finished converting document 10-Q_2024-06-20 in 1.44 sec.
2025-11-14 15:27:17,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-06-20' --> 'data\processed_data\ACN\10-Q_2024-06-20.md'


2025-11-14 15:27:17,877 - INFO - Going to convert document batch...
2025-11-14 15:27:17,878 - INFO - Processing document 10-Q_2024-12-19
2025-11-14 15:27:18,477 - INFO - Finished converting document 10-Q_2024-12-19 in 0.89 sec.
2025-11-14 15:27:18,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-12-19' --> 'data\processed_data\ACN\10-Q_2024-12-19.md'


2025-11-14 15:27:19,183 - INFO - Going to convert document batch...
2025-11-14 15:27:19,183 - INFO - Processing document 10-Q_2025-03-20
2025-11-14 15:27:20,359 - INFO - Finished converting document 10-Q_2025-03-20 in 1.56 sec.
2025-11-14 15:27:20,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2025-03-20' --> 'data\processed_data\ACN\10-Q_2025-03-20.md'


2025-11-14 15:27:21,162 - INFO - Going to convert document batch...
2025-11-14 15:27:21,163 - INFO - Processing document 10-Q_2025-06-20
2025-11-14 15:27:21,934 - INFO - Finished converting document 10-Q_2025-06-20 in 1.16 sec.
2025-11-14 15:27:22,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,376 - INFO - Going to convert document batch...
2025-11-14 15:27:22,377 - INFO - Processing document 4_2023-01-04
2025-11-14 15:27:22,397 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:27:22,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,445 - INFO - Going to convert document batch...
2025-11-14 15:27:22,448 - INFO - Processing document 4_2023-01-09
2025-11-14 15:27:22,472 - INFO - Finished converting document 4_2023-01-09 in 0.05 sec.
2025-11-14 15:27:22,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,516 - INFO - Going to convert document batch...
2025-11-14 15:27:22,

Converted 'data\edgar_documents\ACN\10-Q_2025-06-20' --> 'data\processed_data\ACN\10-Q_2025-06-20.md'
Converted 'data\edgar_documents\ACN\4_2023-01-04' --> 'data\processed_data\ACN\4_2023-01-04.md'
Converted 'data\edgar_documents\ACN\4_2023-01-09' --> 'data\processed_data\ACN\4_2023-01-09.md'


2025-11-14 15:27:22,539 - INFO - Finished converting document 4_2023-01-17 in 0.05 sec.
2025-11-14 15:27:22,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,585 - INFO - Going to convert document batch...
2025-11-14 15:27:22,586 - INFO - Processing document 4_2023-01-18
2025-11-14 15:27:22,612 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:27:22,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,662 - INFO - Going to convert document batch...
2025-11-14 15:27:22,663 - INFO - Processing document 4_2023-01-23
2025-11-14 15:27:22,691 - INFO - Finished converting document 4_2023-01-23 in 0.05 sec.
2025-11-14 15:27:22,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,741 - INFO - Going to convert document batch...
2025-11-14 15:27:22,742 - INFO - Processing document 4_2023-01-24


Converted 'data\edgar_documents\ACN\4_2023-01-17' --> 'data\processed_data\ACN\4_2023-01-17.md'
Converted 'data\edgar_documents\ACN\4_2023-01-18' --> 'data\processed_data\ACN\4_2023-01-18.md'
Converted 'data\edgar_documents\ACN\4_2023-01-23' --> 'data\processed_data\ACN\4_2023-01-23.md'


2025-11-14 15:27:22,766 - INFO - Finished converting document 4_2023-01-24 in 0.05 sec.
2025-11-14 15:27:22,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,817 - INFO - Going to convert document batch...
2025-11-14 15:27:22,818 - INFO - Processing document 4_2023-01-30
2025-11-14 15:27:22,835 - INFO - Finished converting document 4_2023-01-30 in 0.03 sec.
2025-11-14 15:27:22,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,873 - INFO - Going to convert document batch...
2025-11-14 15:27:22,873 - INFO - Processing document 4_2023-02-02
2025-11-14 15:27:22,928 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.
2025-11-14 15:27:22,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,971 - INFO - Going to convert document batch...
2025-11-14 15:27:22,972 - INFO - Processing document 4_2023-02-03


Converted 'data\edgar_documents\ACN\4_2023-01-24' --> 'data\processed_data\ACN\4_2023-01-24.md'
Converted 'data\edgar_documents\ACN\4_2023-01-30' --> 'data\processed_data\ACN\4_2023-01-30.md'
Converted 'data\edgar_documents\ACN\4_2023-02-02' --> 'data\processed_data\ACN\4_2023-02-02.md'


2025-11-14 15:27:22,992 - INFO - Finished converting document 4_2023-02-03 in 0.03 sec.
2025-11-14 15:27:23,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,033 - INFO - Going to convert document batch...
2025-11-14 15:27:23,034 - INFO - Processing document 4_2023-02-06
2025-11-14 15:27:23,055 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 15:27:23,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,097 - INFO - Going to convert document batch...
2025-11-14 15:27:23,098 - INFO - Processing document 4_2023-02-17
2025-11-14 15:27:23,118 - INFO - Finished converting document 4_2023-02-17 in 0.03 sec.
2025-11-14 15:27:23,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,159 - INFO - Going to convert document batch...
2025-11-14 15:27:23,159 - INFO - Processing document 4_2023-03-07
2025-11-14 15:27:23,178 - INFO - Finished converting document 4_2023-03-07 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2023-02-03' --> 'data\processed_data\ACN\4_2023-02-03.md'
Converted 'data\edgar_documents\ACN\4_2023-02-06' --> 'data\processed_data\ACN\4_2023-02-06.md'
Converted 'data\edgar_documents\ACN\4_2023-02-17' --> 'data\processed_data\ACN\4_2023-02-17.md'


2025-11-14 15:27:23,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,223 - INFO - Going to convert document batch...
2025-11-14 15:27:23,224 - INFO - Processing document 4_2023-03-30
2025-11-14 15:27:23,246 - INFO - Finished converting document 4_2023-03-30 in 0.05 sec.
2025-11-14 15:27:23,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,295 - INFO - Going to convert document batch...
2025-11-14 15:27:23,296 - INFO - Processing document 4_2023-04-06
2025-11-14 15:27:23,319 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 15:27:23,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,368 - INFO - Going to convert document batch...
2025-11-14 15:27:23,370 - INFO - Processing document 4_2023-04-18
2025-11-14 15:27:23,396 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2023-03-07' --> 'data\processed_data\ACN\4_2023-03-07.md'
Converted 'data\edgar_documents\ACN\4_2023-03-30' --> 'data\processed_data\ACN\4_2023-03-30.md'
Converted 'data\edgar_documents\ACN\4_2023-04-06' --> 'data\processed_data\ACN\4_2023-04-06.md'


2025-11-14 15:27:23,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,448 - INFO - Going to convert document batch...
2025-11-14 15:27:23,450 - INFO - Processing document 4_2023-04-24
2025-11-14 15:27:23,473 - INFO - Finished converting document 4_2023-04-24 in 0.05 sec.
2025-11-14 15:27:23,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,521 - INFO - Going to convert document batch...
2025-11-14 15:27:23,522 - INFO - Processing document 4_2023-04-25
2025-11-14 15:27:23,543 - INFO - Finished converting document 4_2023-04-25 in 0.05 sec.
2025-11-14 15:27:23,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,593 - INFO - Going to convert document batch...
2025-11-14 15:27:23,594 - INFO - Processing document 4_2023-05-02


Converted 'data\edgar_documents\ACN\4_2023-04-18' --> 'data\processed_data\ACN\4_2023-04-18.md'
Converted 'data\edgar_documents\ACN\4_2023-04-24' --> 'data\processed_data\ACN\4_2023-04-24.md'
Converted 'data\edgar_documents\ACN\4_2023-04-25' --> 'data\processed_data\ACN\4_2023-04-25.md'


2025-11-14 15:27:23,612 - INFO - Finished converting document 4_2023-05-02 in 0.03 sec.
2025-11-14 15:27:23,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,660 - INFO - Going to convert document batch...
2025-11-14 15:27:23,661 - INFO - Processing document 4_2023-05-08
2025-11-14 15:27:23,683 - INFO - Finished converting document 4_2023-05-08 in 0.05 sec.
2025-11-14 15:27:23,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,746 - INFO - Going to convert document batch...
2025-11-14 15:27:23,747 - INFO - Processing document 4_2023-05-16
2025-11-14 15:27:23,765 - INFO - Finished converting document 4_2023-05-16 in 0.06 sec.
2025-11-14 15:27:23,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,814 - INFO - Going to convert document batch...
2025-11-14 15:27:23,815 - INFO - Processing document 4_2023-06-06
2025-11-14 15:27:23,836 - INFO - Finished converting document 4_2023-06-06 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2023-05-02' --> 'data\processed_data\ACN\4_2023-05-02.md'
Converted 'data\edgar_documents\ACN\4_2023-05-08' --> 'data\processed_data\ACN\4_2023-05-08.md'
Converted 'data\edgar_documents\ACN\4_2023-05-16' --> 'data\processed_data\ACN\4_2023-05-16.md'


2025-11-14 15:27:23,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,882 - INFO - Going to convert document batch...
2025-11-14 15:27:23,883 - INFO - Processing document 4_2023-06-27
2025-11-14 15:27:23,904 - INFO - Finished converting document 4_2023-06-27 in 0.05 sec.
2025-11-14 15:27:23,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,950 - INFO - Going to convert document batch...
2025-11-14 15:27:23,951 - INFO - Processing document 4_2023-07-06
2025-11-14 15:27:23,971 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 15:27:24,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,023 - INFO - Going to convert document batch...
2025-11-14 15:27:24,024 - INFO - Processing document 4_2023-07-17
2025-11-14 15:27:24,050 - INFO - Finished converting document 4_2023-07-17 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2023-06-06' --> 'data\processed_data\ACN\4_2023-06-06.md'
Converted 'data\edgar_documents\ACN\4_2023-06-27' --> 'data\processed_data\ACN\4_2023-06-27.md'
Converted 'data\edgar_documents\ACN\4_2023-07-06' --> 'data\processed_data\ACN\4_2023-07-06.md'


2025-11-14 15:27:24,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,100 - INFO - Going to convert document batch...
2025-11-14 15:27:24,100 - INFO - Processing document 4_2023-07-24
2025-11-14 15:27:24,126 - INFO - Finished converting document 4_2023-07-24 in 0.05 sec.
2025-11-14 15:27:24,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,174 - INFO - Going to convert document batch...
2025-11-14 15:27:24,175 - INFO - Processing document 4_2023-07-28
2025-11-14 15:27:24,201 - INFO - Finished converting document 4_2023-07-28 in 0.05 sec.
2025-11-14 15:27:24,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,250 - INFO - Going to convert document batch...
2025-11-14 15:27:24,251 - INFO - Processing document 4_2023-08-08


Converted 'data\edgar_documents\ACN\4_2023-07-17' --> 'data\processed_data\ACN\4_2023-07-17.md'
Converted 'data\edgar_documents\ACN\4_2023-07-24' --> 'data\processed_data\ACN\4_2023-07-24.md'
Converted 'data\edgar_documents\ACN\4_2023-07-28' --> 'data\processed_data\ACN\4_2023-07-28.md'


2025-11-14 15:27:24,624 - INFO - Finished converting document 4_2023-08-08 in 0.41 sec.
2025-11-14 15:27:24,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,696 - INFO - Going to convert document batch...
2025-11-14 15:27:24,697 - INFO - Processing document 4_2023-08-16
2025-11-14 15:27:24,715 - INFO - Finished converting document 4_2023-08-16 in 0.06 sec.
2025-11-14 15:27:24,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,756 - INFO - Going to convert document batch...
2025-11-14 15:27:24,756 - INFO - Processing document 4_2023-09-07
2025-11-14 15:27:24,775 - INFO - Finished converting document 4_2023-09-07 in 0.03 sec.
2025-11-14 15:27:24,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,822 - INFO - Going to convert document batch...
2025-11-14 15:27:24,822 - INFO - Processing document 4_2023-09-14


Converted 'data\edgar_documents\ACN\4_2023-08-08' --> 'data\processed_data\ACN\4_2023-08-08.md'
Converted 'data\edgar_documents\ACN\4_2023-08-16' --> 'data\processed_data\ACN\4_2023-08-16.md'
Converted 'data\edgar_documents\ACN\4_2023-09-07' --> 'data\processed_data\ACN\4_2023-09-07.md'


2025-11-14 15:27:24,845 - INFO - Finished converting document 4_2023-09-14 in 0.05 sec.
2025-11-14 15:27:24,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,898 - INFO - Going to convert document batch...
2025-11-14 15:27:24,899 - INFO - Processing document 4_2023-10-10
2025-11-14 15:27:24,918 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.
2025-11-14 15:27:24,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,963 - INFO - Going to convert document batch...
2025-11-14 15:27:24,964 - INFO - Processing document 4_2023-10-16
2025-11-14 15:27:24,991 - INFO - Finished converting document 4_2023-10-16 in 0.05 sec.
2025-11-14 15:27:25,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,042 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2023-09-14' --> 'data\processed_data\ACN\4_2023-09-14.md'
Converted 'data\edgar_documents\ACN\4_2023-10-10' --> 'data\processed_data\ACN\4_2023-10-10.md'
Converted 'data\edgar_documents\ACN\4_2023-10-16' --> 'data\processed_data\ACN\4_2023-10-16.md'


2025-11-14 15:27:25,043 - INFO - Processing document 4_2023-10-20
2025-11-14 15:27:25,065 - INFO - Finished converting document 4_2023-10-20 in 0.05 sec.
2025-11-14 15:27:25,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,122 - INFO - Going to convert document batch...
2025-11-14 15:27:25,122 - INFO - Processing document 4_2023-10-23
2025-11-14 15:27:25,151 - INFO - Finished converting document 4_2023-10-23 in 0.06 sec.
2025-11-14 15:27:25,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,200 - INFO - Going to convert document batch...
2025-11-14 15:27:25,200 - INFO - Processing document 4_2023-10-24
2025-11-14 15:27:25,225 - INFO - Finished converting document 4_2023-10-24 in 0.05 sec.
2025-11-14 15:27:25,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2023-10-20' --> 'data\processed_data\ACN\4_2023-10-20.md'
Converted 'data\edgar_documents\ACN\4_2023-10-23' --> 'data\processed_data\ACN\4_2023-10-23.md'
Converted 'data\edgar_documents\ACN\4_2023-10-24' --> 'data\processed_data\ACN\4_2023-10-24.md'


2025-11-14 15:27:25,300 - INFO - Going to convert document batch...
2025-11-14 15:27:25,302 - INFO - Processing document 4_2023-10-25
2025-11-14 15:27:25,326 - INFO - Finished converting document 4_2023-10-25 in 0.08 sec.
2025-11-14 15:27:25,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,377 - INFO - Going to convert document batch...
2025-11-14 15:27:25,377 - INFO - Processing document 4_2023-10-31
2025-11-14 15:27:25,400 - INFO - Finished converting document 4_2023-10-31 in 0.05 sec.
2025-11-14 15:27:25,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,442 - INFO - Going to convert document batch...
2025-11-14 15:27:25,443 - INFO - Processing document 4_2023-11-02
2025-11-14 15:27:25,485 - INFO - Finished converting document 4_2023-11-02 in 0.06 sec.
2025-11-14 15:27:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,532 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2023-10-25' --> 'data\processed_data\ACN\4_2023-10-25.md'
Converted 'data\edgar_documents\ACN\4_2023-10-31' --> 'data\processed_data\ACN\4_2023-10-31.md'
Converted 'data\edgar_documents\ACN\4_2023-11-02' --> 'data\processed_data\ACN\4_2023-11-02.md'


2025-11-14 15:27:25,533 - INFO - Processing document 4_2023-11-06
2025-11-14 15:27:25,553 - INFO - Finished converting document 4_2023-11-06 in 0.03 sec.
2025-11-14 15:27:25,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,600 - INFO - Going to convert document batch...
2025-11-14 15:27:25,601 - INFO - Processing document 4_2023-11-13
2025-11-14 15:27:25,627 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:27:25,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,675 - INFO - Going to convert document batch...
2025-11-14 15:27:25,675 - INFO - Processing document 4_2023-11-16
2025-11-14 15:27:25,697 - INFO - Finished converting document 4_2023-11-16 in 0.03 sec.
2025-11-14 15:27:25,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,738 - INFO - Going to convert document batch...
2025-11-14 15:27:25,739 - INFO - Processing document 4_2023-12-06
2025-11-14 15:27:25,757 - IN

Converted 'data\edgar_documents\ACN\4_2023-11-06' --> 'data\processed_data\ACN\4_2023-11-06.md'
Converted 'data\edgar_documents\ACN\4_2023-11-13' --> 'data\processed_data\ACN\4_2023-11-13.md'
Converted 'data\edgar_documents\ACN\4_2023-11-16' --> 'data\processed_data\ACN\4_2023-11-16.md'


2025-11-14 15:27:25,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,814 - INFO - Going to convert document batch...
2025-11-14 15:27:25,816 - INFO - Processing document 4_2023-12-26
2025-11-14 15:27:25,842 - INFO - Finished converting document 4_2023-12-26 in 0.06 sec.
2025-11-14 15:27:25,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,887 - INFO - Going to convert document batch...
2025-11-14 15:27:25,888 - INFO - Processing document 4_2023-12-28
2025-11-14 15:27:25,908 - INFO - Finished converting document 4_2023-12-28 in 0.05 sec.
2025-11-14 15:27:25,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,955 - INFO - Going to convert document batch...
2025-11-14 15:27:25,955 - INFO - Processing document 4_2024-01-03


Converted 'data\edgar_documents\ACN\4_2023-12-06' --> 'data\processed_data\ACN\4_2023-12-06.md'
Converted 'data\edgar_documents\ACN\4_2023-12-26' --> 'data\processed_data\ACN\4_2023-12-26.md'
Converted 'data\edgar_documents\ACN\4_2023-12-28' --> 'data\processed_data\ACN\4_2023-12-28.md'


2025-11-14 15:27:25,975 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 15:27:26,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,020 - INFO - Going to convert document batch...
2025-11-14 15:27:26,021 - INFO - Processing document 4_2024-01-08
2025-11-14 15:27:26,041 - INFO - Finished converting document 4_2024-01-08 in 0.03 sec.
2025-11-14 15:27:26,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,084 - INFO - Going to convert document batch...
2025-11-14 15:27:26,086 - INFO - Processing document 4_2024-01-22
2025-11-14 15:27:26,115 - INFO - Finished converting document 4_2024-01-22 in 0.05 sec.
2025-11-14 15:27:26,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,160 - INFO - Going to convert document batch...
2025-11-14 15:27:26,161 - INFO - Processing document 4_2024-01-29
2025-11-14 15:27:26,185 - INFO - Finished converting document 4_2024-01-29 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2024-01-03' --> 'data\processed_data\ACN\4_2024-01-03.md'
Converted 'data\edgar_documents\ACN\4_2024-01-08' --> 'data\processed_data\ACN\4_2024-01-08.md'
Converted 'data\edgar_documents\ACN\4_2024-01-22' --> 'data\processed_data\ACN\4_2024-01-22.md'


2025-11-14 15:27:26,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,235 - INFO - Going to convert document batch...
2025-11-14 15:27:26,236 - INFO - Processing document 4_2024-01-30
2025-11-14 15:27:26,257 - INFO - Finished converting document 4_2024-01-30 in 0.05 sec.
2025-11-14 15:27:26,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,309 - INFO - Going to convert document batch...
2025-11-14 15:27:26,310 - INFO - Processing document 4_2024-02-01
2025-11-14 15:27:26,330 - INFO - Finished converting document 4_2024-02-01 in 0.05 sec.
2025-11-14 15:27:26,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,373 - INFO - Going to convert document batch...
2025-11-14 15:27:26,374 - INFO - Processing document 4_2024-02-05


Converted 'data\edgar_documents\ACN\4_2024-01-29' --> 'data\processed_data\ACN\4_2024-01-29.md'
Converted 'data\edgar_documents\ACN\4_2024-01-30' --> 'data\processed_data\ACN\4_2024-01-30.md'
Converted 'data\edgar_documents\ACN\4_2024-02-01' --> 'data\processed_data\ACN\4_2024-02-01.md'


2025-11-14 15:27:26,395 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 15:27:26,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,441 - INFO - Going to convert document batch...
2025-11-14 15:27:26,442 - INFO - Processing document 4_2024-02-06
2025-11-14 15:27:26,464 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 15:27:26,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,524 - INFO - Going to convert document batch...
2025-11-14 15:27:26,525 - INFO - Processing document 4_2024-02-12
2025-11-14 15:27:26,544 - INFO - Finished converting document 4_2024-02-12 in 0.06 sec.
2025-11-14 15:27:26,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,608 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-02-05' --> 'data\processed_data\ACN\4_2024-02-05.md'
Converted 'data\edgar_documents\ACN\4_2024-02-06' --> 'data\processed_data\ACN\4_2024-02-06.md'
Converted 'data\edgar_documents\ACN\4_2024-02-12' --> 'data\processed_data\ACN\4_2024-02-12.md'


2025-11-14 15:27:26,608 - INFO - Processing document 4_2024-02-20
2025-11-14 15:27:26,630 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 15:27:26,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,672 - INFO - Going to convert document batch...
2025-11-14 15:27:26,673 - INFO - Processing document 4_2024-03-07
2025-11-14 15:27:26,692 - INFO - Finished converting document 4_2024-03-07 in 0.03 sec.
2025-11-14 15:27:26,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,754 - INFO - Going to convert document batch...
2025-11-14 15:27:26,755 - INFO - Processing document 4_2024-03-26
2025-11-14 15:27:26,783 - INFO - Finished converting document 4_2024-03-26 in 0.08 sec.
2025-11-14 15:27:26,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-02-20' --> 'data\processed_data\ACN\4_2024-02-20.md'
Converted 'data\edgar_documents\ACN\4_2024-03-07' --> 'data\processed_data\ACN\4_2024-03-07.md'
Converted 'data\edgar_documents\ACN\4_2024-03-26' --> 'data\processed_data\ACN\4_2024-03-26.md'


2025-11-14 15:27:26,851 - INFO - Going to convert document batch...
2025-11-14 15:27:26,851 - INFO - Processing document 4_2024-04-08
2025-11-14 15:27:26,872 - INFO - Finished converting document 4_2024-04-08 in 0.06 sec.
2025-11-14 15:27:26,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,918 - INFO - Going to convert document batch...
2025-11-14 15:27:26,918 - INFO - Processing document 4_2024-04-16
2025-11-14 15:27:26,945 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 15:27:26,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,994 - INFO - Going to convert document batch...
2025-11-14 15:27:26,996 - INFO - Processing document 4_2024-04-22
2025-11-14 15:27:27,022 - INFO - Finished converting document 4_2024-04-22 in 0.05 sec.
2025-11-14 15:27:27,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,068 - INFO - Going to convert document batch...
2025-11-14 15:27:27,069 - 

Converted 'data\edgar_documents\ACN\4_2024-04-08' --> 'data\processed_data\ACN\4_2024-04-08.md'
Converted 'data\edgar_documents\ACN\4_2024-04-16' --> 'data\processed_data\ACN\4_2024-04-16.md'
Converted 'data\edgar_documents\ACN\4_2024-04-22' --> 'data\processed_data\ACN\4_2024-04-22.md'


2025-11-14 15:27:27,093 - INFO - Finished converting document 4_2024-04-26 in 0.05 sec.
2025-11-14 15:27:27,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,144 - INFO - Going to convert document batch...
2025-11-14 15:27:27,145 - INFO - Processing document 4_2024-05-03
2025-11-14 15:27:27,165 - INFO - Finished converting document 4_2024-05-03 in 0.03 sec.
2025-11-14 15:27:27,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,206 - INFO - Going to convert document batch...
2025-11-14 15:27:27,207 - INFO - Processing document 4_2024-05-06
2025-11-14 15:27:27,225 - INFO - Finished converting document 4_2024-05-06 in 0.03 sec.
2025-11-14 15:27:27,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,293 - INFO - Going to convert document batch...
2025-11-14 15:27:27,295 - INFO - Processing document 4_2024-05-14
2025-11-14 15:27:27,321 - INFO - Finished converting document 4_2024-05-14 in 0.06 sec.


Converted 'data\edgar_documents\ACN\4_2024-04-26' --> 'data\processed_data\ACN\4_2024-04-26.md'
Converted 'data\edgar_documents\ACN\4_2024-05-03' --> 'data\processed_data\ACN\4_2024-05-03.md'
Converted 'data\edgar_documents\ACN\4_2024-05-06' --> 'data\processed_data\ACN\4_2024-05-06.md'


2025-11-14 15:27:27,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,366 - INFO - Going to convert document batch...
2025-11-14 15:27:27,367 - INFO - Processing document 4_2024-05-17
2025-11-14 15:27:27,386 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 15:27:27,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,442 - INFO - Going to convert document batch...
2025-11-14 15:27:27,443 - INFO - Processing document 4_2024-06-06
2025-11-14 15:27:27,463 - INFO - Finished converting document 4_2024-06-06 in 0.06 sec.
2025-11-14 15:27:27,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,507 - INFO - Going to convert document batch...
2025-11-14 15:27:27,508 - INFO - Processing document 4_2024-07-08
2025-11-14 15:27:27,533 - INFO - Finished converting document 4_2024-07-08 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2024-05-14' --> 'data\processed_data\ACN\4_2024-05-14.md'
Converted 'data\edgar_documents\ACN\4_2024-05-17' --> 'data\processed_data\ACN\4_2024-05-17.md'
Converted 'data\edgar_documents\ACN\4_2024-06-06' --> 'data\processed_data\ACN\4_2024-06-06.md'


2025-11-14 15:27:27,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,574 - INFO - Going to convert document batch...
2025-11-14 15:27:27,576 - INFO - Processing document 4_2024-07-15
2025-11-14 15:27:27,606 - INFO - Finished converting document 4_2024-07-15 in 0.06 sec.
2025-11-14 15:27:27,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,648 - INFO - Going to convert document batch...
2025-11-14 15:27:27,649 - INFO - Processing document 4_2024-07-23
2025-11-14 15:27:27,672 - INFO - Finished converting document 4_2024-07-23 in 0.05 sec.
2025-11-14 15:27:27,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,717 - INFO - Going to convert document batch...
2025-11-14 15:27:27,718 - INFO - Processing document 4_2024-07-24


Converted 'data\edgar_documents\ACN\4_2024-07-08' --> 'data\processed_data\ACN\4_2024-07-08.md'
Converted 'data\edgar_documents\ACN\4_2024-07-15' --> 'data\processed_data\ACN\4_2024-07-15.md'
Converted 'data\edgar_documents\ACN\4_2024-07-23' --> 'data\processed_data\ACN\4_2024-07-23.md'


2025-11-14 15:27:27,742 - INFO - Finished converting document 4_2024-07-24 in 0.05 sec.
2025-11-14 15:27:27,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,818 - INFO - Going to convert document batch...
2025-11-14 15:27:27,820 - INFO - Processing document 4_2024-08-06
2025-11-14 15:27:27,847 - INFO - Finished converting document 4_2024-08-06 in 0.06 sec.
2025-11-14 15:27:27,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,889 - INFO - Going to convert document batch...
2025-11-14 15:27:27,890 - INFO - Processing document 4_2024-08-16
2025-11-14 15:27:27,910 - INFO - Finished converting document 4_2024-08-16 in 0.03 sec.
2025-11-14 15:27:27,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,970 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-07-24' --> 'data\processed_data\ACN\4_2024-07-24.md'
Converted 'data\edgar_documents\ACN\4_2024-08-06' --> 'data\processed_data\ACN\4_2024-08-06.md'
Converted 'data\edgar_documents\ACN\4_2024-08-16' --> 'data\processed_data\ACN\4_2024-08-16.md'


2025-11-14 15:27:27,971 - INFO - Processing document 4_2024-09-06
2025-11-14 15:27:27,990 - INFO - Finished converting document 4_2024-09-06 in 0.05 sec.
2025-11-14 15:27:28,040 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:27:28,040 - ERROR - Input document 4_2024-10-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:27:28,042 - INFO - Going to convert document batch...
2025-11-14 15:27:28,102 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\ACN\4_2024-09-06' --> 'data\processed_data\ACN\4_2024-09-06.md'
Error processing data\edgar_documents\ACN\4_2024-10-01: File format not allowed: data\edgar_documents\ACN\4_2024-10-01
Error processing data\edgar_documents\ACN\4_2024-10-03: File format not allowed: data\edgar_documents\ACN\4_2024-10-03
Converted 'data\edgar_documents\ACN\4_2024-10-07' --> 'data\processed_data\ACN\4_2024-10-07.md'


2025-11-14 15:27:28,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,261 - INFO - Going to convert document batch...
2025-11-14 15:27:28,262 - INFO - Processing document 4_2024-10-18
2025-11-14 15:27:28,286 - INFO - Finished converting document 4_2024-10-18 in 0.05 sec.
2025-11-14 15:27:28,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,336 - INFO - Going to convert document batch...
2025-11-14 15:27:28,337 - INFO - Processing document 4_2024-10-22
2025-11-14 15:27:28,360 - INFO - Finished converting document 4_2024-10-22 in 0.05 sec.
2025-11-14 15:27:28,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,420 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-10-16' --> 'data\processed_data\ACN\4_2024-10-16.md'
Converted 'data\edgar_documents\ACN\4_2024-10-18' --> 'data\processed_data\ACN\4_2024-10-18.md'
Converted 'data\edgar_documents\ACN\4_2024-10-22' --> 'data\processed_data\ACN\4_2024-10-22.md'


2025-11-14 15:27:28,421 - INFO - Processing document 4_2024-10-23
2025-11-14 15:27:28,455 - INFO - Finished converting document 4_2024-10-23 in 0.08 sec.
2025-11-14 15:27:28,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,503 - INFO - Going to convert document batch...
2025-11-14 15:27:28,503 - INFO - Processing document 4_2024-10-24
2025-11-14 15:27:28,526 - INFO - Finished converting document 4_2024-10-24 in 0.05 sec.
2025-11-14 15:27:28,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,575 - INFO - Going to convert document batch...
2025-11-14 15:27:28,576 - INFO - Processing document 4_2024-10-29
2025-11-14 15:27:28,604 - INFO - Finished converting document 4_2024-10-29 in 0.06 sec.
2025-11-14 15:27:28,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,658 - INFO - Going to convert document batch...
2025-11-14 15:27:28,658 - INFO - Processing document 4_2024-11-05
2025-11-14 15:27:28,686 - IN

Converted 'data\edgar_documents\ACN\4_2024-10-23' --> 'data\processed_data\ACN\4_2024-10-23.md'
Converted 'data\edgar_documents\ACN\4_2024-10-24' --> 'data\processed_data\ACN\4_2024-10-24.md'
Converted 'data\edgar_documents\ACN\4_2024-10-29' --> 'data\processed_data\ACN\4_2024-10-29.md'


2025-11-14 15:27:28,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,733 - INFO - Going to convert document batch...
2025-11-14 15:27:28,734 - INFO - Processing document 4_2024-11-06
2025-11-14 15:27:28,753 - INFO - Finished converting document 4_2024-11-06 in 0.03 sec.
2025-11-14 15:27:28,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,797 - INFO - Going to convert document batch...
2025-11-14 15:27:28,798 - INFO - Processing document 4_2024-11-19
2025-11-14 15:27:28,819 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 15:27:28,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,860 - INFO - Going to convert document batch...
2025-11-14 15:27:28,862 - INFO - Processing document 4_2024-12-03
2025-11-14 15:27:28,882 - INFO - Finished converting document 4_2024-12-03 in 0.03 sec.
2025-11-14 15:27:28,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-11-05' --> 'data\processed_data\ACN\4_2024-11-05.md'
Converted 'data\edgar_documents\ACN\4_2024-11-06' --> 'data\processed_data\ACN\4_2024-11-06.md'
Converted 'data\edgar_documents\ACN\4_2024-11-19' --> 'data\processed_data\ACN\4_2024-11-19.md'
Converted 'data\edgar_documents\ACN\4_2024-12-03' --> 'data\processed_data\ACN\4_2024-12-03.md'


2025-11-14 15:27:28,940 - INFO - Going to convert document batch...
2025-11-14 15:27:28,941 - INFO - Processing document 4_2024-12-06
2025-11-14 15:27:28,963 - INFO - Finished converting document 4_2024-12-06 in 0.06 sec.
2025-11-14 15:27:29,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-12-06' --> 'data\processed_data\ACN\4_2024-12-06.md'


2025-11-14 15:27:29,251 - INFO - Going to convert document batch...
2025-11-14 15:27:29,251 - INFO - Processing document 4_2024-12-23
2025-11-14 15:27:29,273 - INFO - Finished converting document 4_2024-12-23 in 0.28 sec.
2025-11-14 15:27:29,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,326 - INFO - Going to convert document batch...
2025-11-14 15:27:29,328 - INFO - Processing document 4_2025-01-03
2025-11-14 15:27:29,348 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:27:29,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,389 - INFO - Going to convert document batch...
2025-11-14 15:27:29,390 - INFO - Processing document 4_2025-01-06
2025-11-14 15:27:29,413 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:27:29,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,475 - INFO - Going to convert document batch...
2025-11-14 15:27:29,476 - 

Converted 'data\edgar_documents\ACN\4_2024-12-23' --> 'data\processed_data\ACN\4_2024-12-23.md'
Converted 'data\edgar_documents\ACN\4_2025-01-03' --> 'data\processed_data\ACN\4_2025-01-03.md'
Converted 'data\edgar_documents\ACN\4_2025-01-06' --> 'data\processed_data\ACN\4_2025-01-06.md'


2025-11-14 15:27:29,501 - INFO - Finished converting document 4_2025-01-21 in 0.06 sec.
2025-11-14 15:27:29,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,555 - INFO - Going to convert document batch...
2025-11-14 15:27:29,555 - INFO - Processing document 4_2025-01-22
2025-11-14 15:27:29,585 - INFO - Finished converting document 4_2025-01-22 in 0.05 sec.
2025-11-14 15:27:29,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,635 - INFO - Going to convert document batch...
2025-11-14 15:27:29,636 - INFO - Processing document 4_2025-01-27
2025-11-14 15:27:29,662 - INFO - Finished converting document 4_2025-01-27 in 0.05 sec.
2025-11-14 15:27:29,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,709 - INFO - Going to convert document batch...
2025-11-14 15:27:29,711 - INFO - Processing document 4_2025-02-04


Converted 'data\edgar_documents\ACN\4_2025-01-21' --> 'data\processed_data\ACN\4_2025-01-21.md'
Converted 'data\edgar_documents\ACN\4_2025-01-22' --> 'data\processed_data\ACN\4_2025-01-22.md'
Converted 'data\edgar_documents\ACN\4_2025-01-27' --> 'data\processed_data\ACN\4_2025-01-27.md'


2025-11-14 15:27:29,731 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 15:27:29,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,781 - INFO - Going to convert document batch...
2025-11-14 15:27:29,782 - INFO - Processing document 4_2025-02-06
2025-11-14 15:27:29,816 - INFO - Finished converting document 4_2025-02-06 in 0.06 sec.
2025-11-14 15:27:29,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,864 - INFO - Going to convert document batch...
2025-11-14 15:27:29,865 - INFO - Processing document 4_2025-02-07
2025-11-14 15:27:29,885 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 15:27:29,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,928 - INFO - Going to convert document batch...
2025-11-14 15:27:29,928 - INFO - Processing document 4_2025-02-18


Converted 'data\edgar_documents\ACN\4_2025-02-04' --> 'data\processed_data\ACN\4_2025-02-04.md'
Converted 'data\edgar_documents\ACN\4_2025-02-06' --> 'data\processed_data\ACN\4_2025-02-06.md'
Converted 'data\edgar_documents\ACN\4_2025-02-07' --> 'data\processed_data\ACN\4_2025-02-07.md'


2025-11-14 15:27:29,951 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:27:29,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,018 - INFO - Going to convert document batch...
2025-11-14 15:27:30,019 - INFO - Processing document 4_2025-03-06
2025-11-14 15:27:30,045 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 15:27:30,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,105 - INFO - Going to convert document batch...
2025-11-14 15:27:30,106 - INFO - Processing document 4_2025-04-07
2025-11-14 15:27:30,124 - INFO - Finished converting document 4_2025-04-07 in 0.06 sec.
2025-11-14 15:27:30,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,169 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-02-18' --> 'data\processed_data\ACN\4_2025-02-18.md'
Converted 'data\edgar_documents\ACN\4_2025-03-06' --> 'data\processed_data\ACN\4_2025-03-06.md'
Converted 'data\edgar_documents\ACN\4_2025-04-07' --> 'data\processed_data\ACN\4_2025-04-07.md'


2025-11-14 15:27:30,170 - INFO - Processing document 4_2025-04-14
2025-11-14 15:27:30,207 - INFO - Finished converting document 4_2025-04-14 in 0.06 sec.
2025-11-14 15:27:30,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,254 - INFO - Going to convert document batch...
2025-11-14 15:27:30,255 - INFO - Processing document 4_2025-05-05
2025-11-14 15:27:30,273 - INFO - Finished converting document 4_2025-05-05 in 0.03 sec.
2025-11-14 15:27:30,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,321 - INFO - Going to convert document batch...
2025-11-14 15:27:30,322 - INFO - Processing document 4_2025-05-06
2025-11-14 15:27:30,339 - INFO - Finished converting document 4_2025-05-06 in 0.05 sec.
2025-11-14 15:27:30,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,384 - INFO - Going to convert document batch...
2025-11-14 15:27:30,384 - INFO - Processing document 4_2025-05-14
2025-11-14 15:27:30,404 - IN

Converted 'data\edgar_documents\ACN\4_2025-04-14' --> 'data\processed_data\ACN\4_2025-04-14.md'
Converted 'data\edgar_documents\ACN\4_2025-05-05' --> 'data\processed_data\ACN\4_2025-05-05.md'
Converted 'data\edgar_documents\ACN\4_2025-05-06' --> 'data\processed_data\ACN\4_2025-05-06.md'


2025-11-14 15:27:30,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,470 - INFO - Going to convert document batch...
2025-11-14 15:27:30,472 - INFO - Processing document 4_2025-05-16
2025-11-14 15:27:30,495 - INFO - Finished converting document 4_2025-05-16 in 0.08 sec.
2025-11-14 15:27:30,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,538 - INFO - Going to convert document batch...
2025-11-14 15:27:30,539 - INFO - Processing document 4_2025-06-09
2025-11-14 15:27:30,556 - INFO - Finished converting document 4_2025-06-09 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2025-05-14' --> 'data\processed_data\ACN\4_2025-05-14.md'
Converted 'data\edgar_documents\ACN\4_2025-05-16' --> 'data\processed_data\ACN\4_2025-05-16.md'
Converted 'data\edgar_documents\ACN\4_2025-06-09' --> 'data\processed_data\ACN\4_2025-06-09.md'


2025-11-14 15:27:30,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,620 - INFO - Going to convert document batch...
2025-11-14 15:27:30,621 - INFO - Processing document 4_2025-07-07
2025-11-14 15:27:30,644 - INFO - Finished converting document 4_2025-07-07 in 0.06 sec.
2025-11-14 15:27:30,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,686 - INFO - Going to convert document batch...
2025-11-14 15:27:30,687 - INFO - Processing document 4_2025-07-14
2025-11-14 15:27:30,711 - INFO - Finished converting document 4_2025-07-14 in 0.05 sec.
2025-11-14 15:27:30,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,772 - INFO - Going to convert document batch...
2025-11-14 15:27:30,773 - INFO - Processing document 4_2025-08-06
2025-11-14 15:27:30,794 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 15:27:30,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ACN\4_2025-07-07' --> 'data\processed_data\ACN\4_2025-07-07.md'
Converted 'data\edgar_documents\ACN\4_2025-07-14' --> 'data\processed_data\ACN\4_2025-07-14.md'
Converted 'data\edgar_documents\ACN\4_2025-08-06' --> 'data\processed_data\ACN\4_2025-08-06.md'


2025-11-14 15:27:30,857 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 15:27:30,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,919 - INFO - Going to convert document batch...
2025-11-14 15:27:30,920 - INFO - Processing document 4_2025-09-08
2025-11-14 15:27:30,939 - INFO - Finished converting document 4_2025-09-08 in 0.06 sec.
2025-11-14 15:27:30,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,994 - INFO - Going to convert document batch...
2025-11-14 15:27:30,995 - INFO - Processing document 4_2025-10-06
2025-11-14 15:27:31,016 - INFO - Finished converting document 4_2025-10-06 in 0.05 sec.
2025-11-14 15:27:31,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,072 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-08-18' --> 'data\processed_data\ACN\4_2025-08-18.md'
Converted 'data\edgar_documents\ACN\4_2025-09-08' --> 'data\processed_data\ACN\4_2025-09-08.md'
Converted 'data\edgar_documents\ACN\4_2025-10-06' --> 'data\processed_data\ACN\4_2025-10-06.md'


2025-11-14 15:27:31,073 - INFO - Processing document 4_2025-10-22
2025-11-14 15:27:31,112 - INFO - Finished converting document 4_2025-10-22 in 0.08 sec.
2025-11-14 15:27:31,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,161 - INFO - Going to convert document batch...
2025-11-14 15:27:31,163 - INFO - Processing document 4_2025-10-23
2025-11-14 15:27:31,186 - INFO - Finished converting document 4_2025-10-23 in 0.05 sec.
2025-11-14 15:27:31,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,238 - INFO - Going to convert document batch...
2025-11-14 15:27:31,239 - INFO - Processing document 4_2025-10-30
2025-11-14 15:27:31,265 - INFO - Finished converting document 4_2025-10-30 in 0.05 sec.
2025-11-14 15:27:31,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2025-10-22' --> 'data\processed_data\ACN\4_2025-10-22.md'
Converted 'data\edgar_documents\ACN\4_2025-10-23' --> 'data\processed_data\ACN\4_2025-10-23.md'
Converted 'data\edgar_documents\ACN\4_2025-10-30' --> 'data\processed_data\ACN\4_2025-10-30.md'


2025-11-14 15:27:31,335 - INFO - Going to convert document batch...
2025-11-14 15:27:31,335 - INFO - Processing document 4_2025-11-04
2025-11-14 15:27:31,371 - INFO - Finished converting document 4_2025-11-04 in 0.08 sec.
2025-11-14 15:27:31,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,415 - INFO - Going to convert document batch...
2025-11-14 15:27:31,415 - INFO - Processing document 4_2025-11-06
2025-11-14 15:27:31,434 - INFO - Finished converting document 4_2025-11-06 in 0.05 sec.
2025-11-14 15:27:31,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,495 - INFO - Going to convert document batch...
2025-11-14 15:27:31,496 - INFO - Processing document 8-K_2023-02-01
2025-11-14 15:27:31,536 - INFO - Finished converting document 8-K_2023-02-01 in 0.08 sec.
2025-11-14 15:27:31,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,591 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-11-04' --> 'data\processed_data\ACN\4_2025-11-04.md'
Converted 'data\edgar_documents\ACN\4_2025-11-06' --> 'data\processed_data\ACN\4_2025-11-06.md'
Converted 'data\edgar_documents\ACN\8-K_2023-02-01' --> 'data\processed_data\ACN\8-K_2023-02-01.md'


2025-11-14 15:27:31,592 - INFO - Processing document 8-K_2023-03-23
2025-11-14 15:27:31,612 - INFO - Finished converting document 8-K_2023-03-23 in 0.06 sec.
2025-11-14 15:27:31,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,672 - INFO - Going to convert document batch...
2025-11-14 15:27:31,673 - INFO - Processing document 8-K_2023-04-14
2025-11-14 15:27:31,699 - INFO - Finished converting document 8-K_2023-04-14 in 0.08 sec.
2025-11-14 15:27:31,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,738 - INFO - Going to convert document batch...
2025-11-14 15:27:31,739 - INFO - Processing document 8-K_2023-06-22
2025-11-14 15:27:31,758 - INFO - Finished converting document 8-K_2023-06-22 in 0.05 sec.
2025-11-14 15:27:31,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,802 - INFO - Going to convert document batch...
2025-11-14 15:27:31,803 - INFO - Processing document 8-K_2023-07-27


Converted 'data\edgar_documents\ACN\8-K_2023-03-23' --> 'data\processed_data\ACN\8-K_2023-03-23.md'
Converted 'data\edgar_documents\ACN\8-K_2023-04-14' --> 'data\processed_data\ACN\8-K_2023-04-14.md'
Converted 'data\edgar_documents\ACN\8-K_2023-06-22' --> 'data\processed_data\ACN\8-K_2023-06-22.md'


2025-11-14 15:27:31,822 - INFO - Finished converting document 8-K_2023-07-27 in 0.05 sec.
2025-11-14 15:27:31,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,865 - INFO - Going to convert document batch...
2025-11-14 15:27:31,866 - INFO - Processing document 8-K_2023-09-28
2025-11-14 15:27:31,888 - INFO - Finished converting document 8-K_2023-09-28 in 0.06 sec.
2025-11-14 15:27:31,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,932 - INFO - Going to convert document batch...
2025-11-14 15:27:31,933 - INFO - Processing document 8-K_2023-12-06
2025-11-14 15:27:31,955 - INFO - Finished converting document 8-K_2023-12-06 in 0.05 sec.
2025-11-14 15:27:31,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,003 - INFO - Going to convert document batch...
2025-11-14 15:27:32,004 - INFO - Processing document 8-K_2023-12-19


Converted 'data\edgar_documents\ACN\8-K_2023-07-27' --> 'data\processed_data\ACN\8-K_2023-07-27.md'
Converted 'data\edgar_documents\ACN\8-K_2023-09-28' --> 'data\processed_data\ACN\8-K_2023-09-28.md'
Converted 'data\edgar_documents\ACN\8-K_2023-12-06' --> 'data\processed_data\ACN\8-K_2023-12-06.md'


2025-11-14 15:27:32,023 - INFO - Finished converting document 8-K_2023-12-19 in 0.05 sec.
2025-11-14 15:27:32,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,073 - INFO - Going to convert document batch...
2025-11-14 15:27:32,074 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:27:32,125 - INFO - Finished converting document 8-K_2024-01-31 in 0.09 sec.
2025-11-14 15:27:32,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,184 - INFO - Going to convert document batch...
2025-11-14 15:27:32,185 - INFO - Processing document 8-K_2024-03-21
2025-11-14 15:27:32,202 - INFO - Finished converting document 8-K_2024-03-21 in 0.05 sec.
2025-11-14 15:27:32,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\8-K_2023-12-19' --> 'data\processed_data\ACN\8-K_2023-12-19.md'
Converted 'data\edgar_documents\ACN\8-K_2024-01-31' --> 'data\processed_data\ACN\8-K_2024-01-31.md'
Converted 'data\edgar_documents\ACN\8-K_2024-03-21' --> 'data\processed_data\ACN\8-K_2024-03-21.md'


2025-11-14 15:27:32,236 - INFO - Going to convert document batch...
2025-11-14 15:27:32,237 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:27:32,255 - INFO - Finished converting document 8-K_2024-05-17 in 0.03 sec.
2025-11-14 15:27:32,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,288 - INFO - Going to convert document batch...
2025-11-14 15:27:32,289 - INFO - Processing document 8-K_2024-06-11
2025-11-14 15:27:32,309 - INFO - Finished converting document 8-K_2024-06-11 in 0.05 sec.
2025-11-14 15:27:32,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,340 - INFO - Going to convert document batch...
2025-11-14 15:27:32,340 - INFO - Processing document 8-K_2024-06-20
2025-11-14 15:27:32,358 - INFO - Finished converting document 8-K_2024-06-20 in 0.05 sec.
2025-11-14 15:27:32,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,390 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ACN\8-K_2024-05-17' --> 'data\processed_data\ACN\8-K_2024-05-17.md'
Converted 'data\edgar_documents\ACN\8-K_2024-06-11' --> 'data\processed_data\ACN\8-K_2024-06-11.md'
Converted 'data\edgar_documents\ACN\8-K_2024-06-20' --> 'data\processed_data\ACN\8-K_2024-06-20.md'
Converted 'data\edgar_documents\ACN\8-K_2024-07-19' --> 'data\processed_data\ACN\8-K_2024-07-19.md'


2025-11-14 15:27:32,459 - INFO - Finished converting document 8-K_2024-09-26 in 0.03 sec.
2025-11-14 15:27:32,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,551 - INFO - Going to convert document batch...
2025-11-14 15:27:32,552 - INFO - Processing document 8-K_2024-09-30
2025-11-14 15:27:32,617 - INFO - Finished converting document 8-K_2024-09-30 in 0.14 sec.
2025-11-14 15:27:32,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,653 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\8-K_2024-09-26' --> 'data\processed_data\ACN\8-K_2024-09-26.md'
Converted 'data\edgar_documents\ACN\8-K_2024-09-30' --> 'data\processed_data\ACN\8-K_2024-09-30.md'


2025-11-14 15:27:32,654 - INFO - Processing document 8-K_2024-10-04
2025-11-14 15:27:32,679 - INFO - Finished converting document 8-K_2024-10-04 in 0.05 sec.
2025-11-14 15:27:32,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,715 - INFO - Going to convert document batch...
2025-11-14 15:27:32,716 - INFO - Processing document 8-K_2024-12-02
2025-11-14 15:27:32,731 - INFO - Finished converting document 8-K_2024-12-02 in 0.05 sec.
2025-11-14 15:27:32,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,762 - INFO - Going to convert document batch...
2025-11-14 15:27:32,763 - INFO - Processing document 8-K_2024-12-19
2025-11-14 15:27:32,782 - INFO - Finished converting document 8-K_2024-12-19 in 0.05 sec.
2025-11-14 15:27:32,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,830 - INFO - Going to convert document batch...
2025-11-14 15:27:32,830 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:

Converted 'data\edgar_documents\ACN\8-K_2024-10-04' --> 'data\processed_data\ACN\8-K_2024-10-04.md'
Converted 'data\edgar_documents\ACN\8-K_2024-12-02' --> 'data\processed_data\ACN\8-K_2024-12-02.md'
Converted 'data\edgar_documents\ACN\8-K_2024-12-19' --> 'data\processed_data\ACN\8-K_2024-12-19.md'


2025-11-14 15:27:32,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,912 - INFO - Going to convert document batch...
2025-11-14 15:27:32,913 - INFO - Processing document 8-K_2025-02-13
2025-11-14 15:27:32,930 - INFO - Finished converting document 8-K_2025-02-13 in 0.03 sec.
2025-11-14 15:27:32,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,961 - INFO - Going to convert document batch...
2025-11-14 15:27:32,962 - INFO - Processing document 8-K_2025-03-20
2025-11-14 15:27:32,978 - INFO - Finished converting document 8-K_2025-03-20 in 0.03 sec.
2025-11-14 15:27:33,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:33,009 - INFO - Going to convert document batch...
2025-11-14 15:27:33,010 - INFO - Processing document 8-K_2025-06-20
2025-11-14 15:27:33,030 - INFO - Finished converting document 8-K_2025-06-20 in 0.05 sec.
2025-11-14 15:27:33,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ACN\8-K_2025-02-06' --> 'data\processed_data\ACN\8-K_2025-02-06.md'
Converted 'data\edgar_documents\ACN\8-K_2025-02-13' --> 'data\processed_data\ACN\8-K_2025-02-13.md'
Converted 'data\edgar_documents\ACN\8-K_2025-03-20' --> 'data\processed_data\ACN\8-K_2025-03-20.md'
Converted 'data\edgar_documents\ACN\8-K_2025-06-20' --> 'data\processed_data\ACN\8-K_2025-06-20.md'


2025-11-14 15:27:33,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:33,118 - INFO - Going to convert document batch...
2025-11-14 15:27:33,118 - INFO - Processing document 8-K_2025-09-25
2025-11-14 15:27:33,139 - INFO - Finished converting document 8-K_2025-09-25 in 0.05 sec.
2025-11-14 15:27:33,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\8-K_2025-07-17' --> 'data\processed_data\ACN\8-K_2025-07-17.md'
Converted 'data\edgar_documents\ACN\8-K_2025-09-25' --> 'data\processed_data\ACN\8-K_2025-09-25.md'


2025-11-14 15:27:33,884 - INFO - Going to convert document batch...
2025-11-14 15:27:33,884 - INFO - Processing document DEF-14A_2023-12-13
2025-11-14 15:27:36,725 - INFO - Finished converting document DEF-14A_2023-12-13 in 3.58 sec.
2025-11-14 15:27:37,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\DEF-14A_2023-12-13' --> 'data\processed_data\ACN\DEF-14A_2023-12-13.md'


2025-11-14 15:27:38,307 - INFO - Going to convert document batch...
2025-11-14 15:27:38,308 - INFO - Processing document DEF-14A_2024-12-16
2025-11-14 15:27:41,128 - INFO - Finished converting document DEF-14A_2024-12-16 in 3.48 sec.
2025-11-14 15:27:42,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\DEF-14A_2024-12-16' --> 'data\processed_data\ACN\DEF-14A_2024-12-16.md'
Processed 151 new files. Errors: 2
Found 127 files to process in data\edgar_documents\ADBE


2025-11-14 15:27:42,910 - INFO - Going to convert document batch...
2025-11-14 15:27:42,911 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:27:42,911 - INFO - Processing document 10-K_2023-01-17
2025-11-14 15:27:44,086 - INFO - Finished converting document 10-K_2023-01-17 in 2.05 sec.
2025-11-14 15:27:44,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2023-01-17' --> 'data\processed_data\ADBE\10-K_2023-01-17.md'


2025-11-14 15:27:45,446 - INFO - Going to convert document batch...
2025-11-14 15:27:45,447 - INFO - Processing document 10-K_2024-01-17
2025-11-14 15:27:46,594 - INFO - Finished converting document 10-K_2024-01-17 in 2.00 sec.
2025-11-14 15:27:47,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2024-01-17' --> 'data\processed_data\ADBE\10-K_2024-01-17.md'


2025-11-14 15:27:47,973 - INFO - Going to convert document batch...
2025-11-14 15:27:47,974 - INFO - Processing document 10-K_2025-01-13
2025-11-14 15:27:49,075 - INFO - Finished converting document 10-K_2025-01-13 in 1.98 sec.
2025-11-14 15:27:49,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2025-01-13' --> 'data\processed_data\ADBE\10-K_2025-01-13.md'


2025-11-14 15:27:49,974 - INFO - Going to convert document batch...
2025-11-14 15:27:49,975 - INFO - Processing document 10-Q_2023-03-29
2025-11-14 15:27:50,695 - INFO - Finished converting document 10-Q_2023-03-29 in 1.11 sec.
2025-11-14 15:27:51,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-03-29' --> 'data\processed_data\ADBE\10-Q_2023-03-29.md'


2025-11-14 15:27:51,960 - INFO - Going to convert document batch...
2025-11-14 15:27:51,961 - INFO - Processing document 10-Q_2023-06-28
2025-11-14 15:27:52,762 - INFO - Finished converting document 10-Q_2023-06-28 in 1.69 sec.
2025-11-14 15:27:53,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-06-28' --> 'data\processed_data\ADBE\10-Q_2023-06-28.md'


2025-11-14 15:27:53,741 - INFO - Going to convert document batch...
2025-11-14 15:27:53,742 - INFO - Processing document 10-Q_2023-09-27
2025-11-14 15:27:54,634 - INFO - Finished converting document 10-Q_2023-09-27 in 1.45 sec.
2025-11-14 15:27:55,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-09-27' --> 'data\processed_data\ADBE\10-Q_2023-09-27.md'


2025-11-14 15:27:55,960 - INFO - Going to convert document batch...
2025-11-14 15:27:55,960 - INFO - Processing document 10-Q_2024-03-27
2025-11-14 15:27:57,026 - INFO - Finished converting document 10-Q_2024-03-27 in 1.56 sec.
2025-11-14 15:27:57,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-03-27' --> 'data\processed_data\ADBE\10-Q_2024-03-27.md'


2025-11-14 15:27:58,099 - INFO - Going to convert document batch...
2025-11-14 15:27:58,100 - INFO - Processing document 10-Q_2024-06-26
2025-11-14 15:27:58,928 - INFO - Finished converting document 10-Q_2024-06-26 in 1.53 sec.
2025-11-14 15:27:59,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-06-26' --> 'data\processed_data\ADBE\10-Q_2024-06-26.md'


2025-11-14 15:27:59,769 - INFO - Going to convert document batch...
2025-11-14 15:27:59,770 - INFO - Processing document 10-Q_2024-09-25
2025-11-14 15:28:00,548 - INFO - Finished converting document 10-Q_2024-09-25 in 1.22 sec.
2025-11-14 15:28:00,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-09-25' --> 'data\processed_data\ADBE\10-Q_2024-09-25.md'


2025-11-14 15:28:01,679 - INFO - Going to convert document batch...
2025-11-14 15:28:01,680 - INFO - Processing document 10-Q_2025-03-26
2025-11-14 15:28:02,371 - INFO - Finished converting document 10-Q_2025-03-26 in 1.42 sec.
2025-11-14 15:28:02,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2025-03-26' --> 'data\processed_data\ADBE\10-Q_2025-03-26.md'


2025-11-14 15:28:03,105 - INFO - Going to convert document batch...
2025-11-14 15:28:03,106 - INFO - Processing document 10-Q_2025-06-25
2025-11-14 15:28:03,815 - INFO - Finished converting document 10-Q_2025-06-25 in 1.11 sec.
2025-11-14 15:28:04,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2025-06-25' --> 'data\processed_data\ADBE\10-Q_2025-06-25.md'


2025-11-14 15:28:04,872 - INFO - Going to convert document batch...
2025-11-14 15:28:04,872 - INFO - Processing document 10-Q_2025-09-24
2025-11-14 15:28:05,603 - INFO - Finished converting document 10-Q_2025-09-24 in 1.42 sec.
2025-11-14 15:28:05,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,008 - INFO - Going to convert document batch...
2025-11-14 15:28:06,008 - INFO - Processing document 4_2023-01-10
2025-11-14 15:28:06,029 - INFO - Finished converting document 4_2023-01-10 in 0.05 sec.
2025-11-14 15:28:06,078 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:06,079 - ERROR - Input document 4_2023-01-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\ADBE\10-Q_2025-09-24' --> 'data\processed_data\ADBE\10-Q_2025-09-24.md'
Converted 'data\edgar_documents\ADBE\4_2023-01-10' --> 'data\processed_data\ADBE\4_2023-01-10.md'
Error processing data\edgar_documents\ADBE\4_2023-01-11: File format not allowed: data\edgar_documents\ADBE\4_2023-01-11
Converted 'data\edgar_documents\ADBE\4_2023-01-12' --> 'data\processed_data\ADBE\4_2023-01-12.md'


2025-11-14 15:28:06,170 - INFO - Processing document 4_2023-01-23
2025-11-14 15:28:06,199 - INFO - Finished converting document 4_2023-01-23 in 0.06 sec.
2025-11-14 15:28:06,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,278 - INFO - Going to convert document batch...
2025-11-14 15:28:06,279 - INFO - Processing document 4_2023-01-26
2025-11-14 15:28:06,321 - INFO - Finished converting document 4_2023-01-26 in 0.09 sec.
2025-11-14 15:28:06,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,377 - INFO - Going to convert document batch...
2025-11-14 15:28:06,377 - INFO - Processing document 4_2023-02-03
2025-11-14 15:28:06,395 - INFO - Finished converting document 4_2023-02-03 in 0.03 sec.
2025-11-14 15:28:06,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-01-23' --> 'data\processed_data\ADBE\4_2023-01-23.md'
Converted 'data\edgar_documents\ADBE\4_2023-01-26' --> 'data\processed_data\ADBE\4_2023-01-26.md'
Converted 'data\edgar_documents\ADBE\4_2023-02-03' --> 'data\processed_data\ADBE\4_2023-02-03.md'


2025-11-14 15:28:06,437 - INFO - Going to convert document batch...
2025-11-14 15:28:06,438 - INFO - Processing document 4_2023-02-16
2025-11-14 15:28:06,462 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 15:28:06,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,504 - INFO - Going to convert document batch...
2025-11-14 15:28:06,504 - INFO - Processing document 4_2023-03-01
2025-11-14 15:28:06,526 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 15:28:06,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,566 - INFO - Going to convert document batch...
2025-11-14 15:28:06,567 - INFO - Processing document 4_2023-03-16
2025-11-14 15:28:06,590 - INFO - Finished converting document 4_2023-03-16 in 0.05 sec.
2025-11-14 15:28:06,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,633 - INFO - Going to convert document batch...
2025-11-14 15:28:06,634 - 

Converted 'data\edgar_documents\ADBE\4_2023-02-16' --> 'data\processed_data\ADBE\4_2023-02-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-01' --> 'data\processed_data\ADBE\4_2023-03-01.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-16' --> 'data\processed_data\ADBE\4_2023-03-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-21' --> 'data\processed_data\ADBE\4_2023-03-21.md'


2025-11-14 15:28:06,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,699 - INFO - Going to convert document batch...
2025-11-14 15:28:06,700 - INFO - Processing document 4_2023-04-18
2025-11-14 15:28:06,726 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.
2025-11-14 15:28:06,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,775 - INFO - Going to convert document batch...
2025-11-14 15:28:06,776 - INFO - Processing document 4_2023-04-24
2025-11-14 15:28:06,803 - INFO - Finished converting document 4_2023-04-24 in 0.05 sec.
2025-11-14 15:28:06,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,851 - INFO - Going to convert document batch...
2025-11-14 15:28:06,852 - INFO - Processing document 4_2023-04-26
2025-11-14 15:28:06,872 - INFO - Finished converting document 4_2023-04-26 in 0.05 sec.
2025-11-14 15:28:06,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2023-04-18' --> 'data\processed_data\ADBE\4_2023-04-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-04-24' --> 'data\processed_data\ADBE\4_2023-04-24.md'
Converted 'data\edgar_documents\ADBE\4_2023-04-26' --> 'data\processed_data\ADBE\4_2023-04-26.md'


2025-11-14 15:28:06,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,986 - INFO - Going to convert document batch...
2025-11-14 15:28:06,988 - INFO - Processing document 4_2023-05-17
2025-11-14 15:28:07,009 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 15:28:07,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,072 - INFO - Going to convert document batch...
2025-11-14 15:28:07,073 - INFO - Processing document 4_2023-05-31
2025-11-14 15:28:07,108 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.


Converted 'data\edgar_documents\ADBE\4_2023-05-03' --> 'data\processed_data\ADBE\4_2023-05-03.md'
Converted 'data\edgar_documents\ADBE\4_2023-05-17' --> 'data\processed_data\ADBE\4_2023-05-17.md'


2025-11-14 15:28:07,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,171 - INFO - Going to convert document batch...
2025-11-14 15:28:07,171 - INFO - Processing document 4_2023-06-15
2025-11-14 15:28:07,197 - INFO - Finished converting document 4_2023-06-15 in 0.05 sec.
2025-11-14 15:28:07,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,265 - INFO - Going to convert document batch...
2025-11-14 15:28:07,266 - INFO - Processing document 4_2023-06-20
2025-11-14 15:28:07,292 - INFO - Finished converting document 4_2023-06-20 in 0.06 sec.
2025-11-14 15:28:07,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-05-31' --> 'data\processed_data\ADBE\4_2023-05-31.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-15' --> 'data\processed_data\ADBE\4_2023-06-15.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-20' --> 'data\processed_data\ADBE\4_2023-06-20.md'


2025-11-14 15:28:07,344 - INFO - Going to convert document batch...
2025-11-14 15:28:07,345 - INFO - Processing document 4_2023-06-22
2025-11-14 15:28:07,373 - INFO - Finished converting document 4_2023-06-22 in 0.06 sec.
2025-11-14 15:28:07,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,423 - INFO - Going to convert document batch...
2025-11-14 15:28:07,424 - INFO - Processing document 4_2023-06-23
2025-11-14 15:28:07,444 - INFO - Finished converting document 4_2023-06-23 in 0.03 sec.
2025-11-14 15:28:07,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,492 - INFO - Going to convert document batch...
2025-11-14 15:28:07,493 - INFO - Processing document 4_2023-07-18
2025-11-14 15:28:07,519 - INFO - Finished converting document 4_2023-07-18 in 0.05 sec.
2025-11-14 15:28:07,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,563 - INFO - Going to convert document batch...
2025-11-14 15:28:07,564 - 

Converted 'data\edgar_documents\ADBE\4_2023-06-22' --> 'data\processed_data\ADBE\4_2023-06-22.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-23' --> 'data\processed_data\ADBE\4_2023-06-23.md'
Converted 'data\edgar_documents\ADBE\4_2023-07-18' --> 'data\processed_data\ADBE\4_2023-07-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-07-26' --> 'data\processed_data\ADBE\4_2023-07-26.md'


2025-11-14 15:28:07,627 - INFO - Going to convert document batch...
2025-11-14 15:28:07,628 - INFO - Processing document 4_2023-08-07
2025-11-14 15:28:07,647 - INFO - Finished converting document 4_2023-08-07 in 0.03 sec.
2025-11-14 15:28:07,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,712 - INFO - Going to convert document batch...
2025-11-14 15:28:07,713 - INFO - Processing document 4_2023-08-17
2025-11-14 15:28:07,734 - INFO - Finished converting document 4_2023-08-17 in 0.06 sec.
2025-11-14 15:28:07,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,777 - INFO - Going to convert document batch...
2025-11-14 15:28:07,777 - INFO - Processing document 4_2023-09-01
2025-11-14 15:28:07,799 - INFO - Finished converting document 4_2023-09-01 in 0.05 sec.
2025-11-14 15:28:07,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,840 - INFO - Going to convert document batch...
2025-11-14 15:28:07,840 - 

Converted 'data\edgar_documents\ADBE\4_2023-08-07' --> 'data\processed_data\ADBE\4_2023-08-07.md'
Converted 'data\edgar_documents\ADBE\4_2023-08-17' --> 'data\processed_data\ADBE\4_2023-08-17.md'
Converted 'data\edgar_documents\ADBE\4_2023-09-01' --> 'data\processed_data\ADBE\4_2023-09-01.md'


2025-11-14 15:28:07,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,913 - INFO - Going to convert document batch...
2025-11-14 15:28:07,914 - INFO - Processing document 4_2023-09-19
2025-11-14 15:28:07,941 - INFO - Finished converting document 4_2023-09-19 in 0.05 sec.
2025-11-14 15:28:07,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,985 - INFO - Going to convert document batch...
2025-11-14 15:28:07,986 - INFO - Processing document 4_2023-10-17
2025-11-14 15:28:08,006 - INFO - Finished converting document 4_2023-10-17 in 0.03 sec.
2025-11-14 15:28:08,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,048 - INFO - Going to convert document batch...
2025-11-14 15:28:08,049 - INFO - Processing document 4_2023-10-26
2025-11-14 15:28:08,075 - INFO - Finished converting document 4_2023-10-26 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2023-09-18' --> 'data\processed_data\ADBE\4_2023-09-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-09-19' --> 'data\processed_data\ADBE\4_2023-09-19.md'
Converted 'data\edgar_documents\ADBE\4_2023-10-17' --> 'data\processed_data\ADBE\4_2023-10-17.md'


2025-11-14 15:28:08,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-10-26' --> 'data\processed_data\ADBE\4_2023-10-26.md'


2025-11-14 15:28:08,474 - INFO - Going to convert document batch...
2025-11-14 15:28:08,475 - INFO - Processing document 4_2023-11-16
2025-11-14 15:28:08,503 - INFO - Finished converting document 4_2023-11-16 in 0.41 sec.
2025-11-14 15:28:08,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,565 - INFO - Going to convert document batch...
2025-11-14 15:28:08,566 - INFO - Processing document 4_2023-12-01
2025-11-14 15:28:08,586 - INFO - Finished converting document 4_2023-12-01 in 0.06 sec.
2025-11-14 15:28:08,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,628 - INFO - Going to convert document batch...
2025-11-14 15:28:08,629 - INFO - Processing document 4_2023-12-18
2025-11-14 15:28:08,651 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 15:28:08,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-11-16' --> 'data\processed_data\ADBE\4_2023-11-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-01' --> 'data\processed_data\ADBE\4_2023-12-01.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-18' --> 'data\processed_data\ADBE\4_2023-12-18.md'


2025-11-14 15:28:08,717 - INFO - Going to convert document batch...
2025-11-14 15:28:08,718 - INFO - Processing document 4_2023-12-19
2025-11-14 15:28:08,746 - INFO - Finished converting document 4_2023-12-19 in 0.08 sec.
2025-11-14 15:28:08,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,814 - INFO - Going to convert document batch...
2025-11-14 15:28:08,815 - INFO - Processing document 4_2023-12-26
2025-11-14 15:28:08,833 - INFO - Finished converting document 4_2023-12-26 in 0.06 sec.
2025-11-14 15:28:08,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,871 - INFO - Going to convert document batch...
2025-11-14 15:28:08,872 - INFO - Processing document 4_2024-01-04
2025-11-14 15:28:08,890 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 15:28:08,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,927 - INFO - Going to convert document batch...
2025-11-14 15:28:08,928 - 

Converted 'data\edgar_documents\ADBE\4_2023-12-19' --> 'data\processed_data\ADBE\4_2023-12-19.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-26' --> 'data\processed_data\ADBE\4_2023-12-26.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-04' --> 'data\processed_data\ADBE\4_2024-01-04.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-08' --> 'data\processed_data\ADBE\4_2024-01-08.md'


2025-11-14 15:28:08,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,008 - INFO - Going to convert document batch...
2025-11-14 15:28:09,010 - INFO - Processing document 4_2024-01-17
2025-11-14 15:28:09,034 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 15:28:09,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,084 - INFO - Going to convert document batch...
2025-11-14 15:28:09,085 - INFO - Processing document 4_2024-01-26
2025-11-14 15:28:09,126 - INFO - Finished converting document 4_2024-01-26 in 0.08 sec.
2025-11-14 15:28:09,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,200 - INFO - Going to convert document batch...
2025-11-14 15:28:09,201 - INFO - Processing document 4_2024-02-15
2025-11-14 15:28:09,226 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-01-17' --> 'data\processed_data\ADBE\4_2024-01-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-26' --> 'data\processed_data\ADBE\4_2024-01-26.md'


2025-11-14 15:28:09,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,268 - INFO - Going to convert document batch...
2025-11-14 15:28:09,268 - INFO - Processing document 4_2024-03-18
2025-11-14 15:28:09,290 - INFO - Finished converting document 4_2024-03-18 in 0.03 sec.
2025-11-14 15:28:09,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,332 - INFO - Going to convert document batch...
2025-11-14 15:28:09,333 - INFO - Processing document 4_2024-03-19
2025-11-14 15:28:09,360 - INFO - Finished converting document 4_2024-03-19 in 0.05 sec.
2025-11-14 15:28:09,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,416 - INFO - Going to convert document batch...
2025-11-14 15:28:09,417 - INFO - Processing document 4_2024-03-28
2025-11-14 15:28:09,435 - INFO - Finished converting document 4_2024-03-28 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-02-15' --> 'data\processed_data\ADBE\4_2024-02-15.md'
Converted 'data\edgar_documents\ADBE\4_2024-03-18' --> 'data\processed_data\ADBE\4_2024-03-18.md'
Converted 'data\edgar_documents\ADBE\4_2024-03-19' --> 'data\processed_data\ADBE\4_2024-03-19.md'


2025-11-14 15:28:09,474 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:09,474 - ERROR - Input document 4_2024-04-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:28:09,476 - INFO - Going to convert document batch...
2025-11-14 15:28:09,495 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:09,496 - ERROR - Input document 4_2024-04-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\ADBE\4_2024-03-28' --> 'data\processed_data\ADBE\4_2024-03-28.md'
Error processing data\edgar_documents\ADBE\4_2024-04-01: File format not allowed: data\edgar_documents\ADBE\4_2024-04-01
Error processing data\edgar_documents\ADBE\4_2024-04-02: File format not allowed: data\edgar_documents\ADBE\4_2024-04-02
Converted 'data\edgar_documents\ADBE\4_2024-04-17' --> 'data\processed_data\ADBE\4_2024-04-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-04-19' --> 'data\processed_data\ADBE\4_2024-04-19.md'


2025-11-14 15:28:09,654 - INFO - Going to convert document batch...
2025-11-14 15:28:09,655 - INFO - Processing document 4_2024-04-23
2025-11-14 15:28:09,672 - INFO - Finished converting document 4_2024-04-23 in 0.05 sec.
2025-11-14 15:28:09,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,745 - INFO - Going to convert document batch...
2025-11-14 15:28:09,747 - INFO - Processing document 4_2024-04-25
2025-11-14 15:28:09,772 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 15:28:09,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,837 - INFO - Going to convert document batch...
2025-11-14 15:28:09,838 - INFO - Processing document 4_2024-05-03
2025-11-14 15:28:09,859 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-04-23' --> 'data\processed_data\ADBE\4_2024-04-23.md'
Converted 'data\edgar_documents\ADBE\4_2024-04-25' --> 'data\processed_data\ADBE\4_2024-04-25.md'
Converted 'data\edgar_documents\ADBE\4_2024-05-03' --> 'data\processed_data\ADBE\4_2024-05-03.md'


2025-11-14 15:28:09,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,917 - INFO - Going to convert document batch...
2025-11-14 15:28:09,917 - INFO - Processing document 4_2024-05-08
2025-11-14 15:28:09,935 - INFO - Finished converting document 4_2024-05-08 in 0.06 sec.
2025-11-14 15:28:09,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,973 - INFO - Going to convert document batch...
2025-11-14 15:28:09,974 - INFO - Processing document 4_2024-05-16
2025-11-14 15:28:09,996 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 15:28:10,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,036 - INFO - Going to convert document batch...
2025-11-14 15:28:10,037 - INFO - Processing document 4_2024-06-04
2025-11-14 15:28:10,055 - INFO - Finished converting document 4_2024-06-04 in 0.03 sec.
2025-11-14 15:28:10,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2024-05-08' --> 'data\processed_data\ADBE\4_2024-05-08.md'
Converted 'data\edgar_documents\ADBE\4_2024-05-16' --> 'data\processed_data\ADBE\4_2024-05-16.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-04' --> 'data\processed_data\ADBE\4_2024-06-04.md'


2025-11-14 15:28:10,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,181 - INFO - Going to convert document batch...
2025-11-14 15:28:10,182 - INFO - Processing document 4_2024-06-20
2025-11-14 15:28:10,200 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 15:28:10,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,241 - INFO - Going to convert document batch...
2025-11-14 15:28:10,242 - INFO - Processing document 4_2024-06-28
2025-11-14 15:28:10,264 - INFO - Finished converting document 4_2024-06-28 in 0.05 sec.
2025-11-14 15:28:10,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,310 - INFO - Going to convert document batch...
2025-11-14 15:28:10,311 - INFO - Processing document 4_2024-07-17
2025-11-14 15:28:10,338 - INFO - Finished converting document 4_2024-07-17 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2024-06-18' --> 'data\processed_data\ADBE\4_2024-06-18.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-20' --> 'data\processed_data\ADBE\4_2024-06-20.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-28' --> 'data\processed_data\ADBE\4_2024-06-28.md'
Converted 'data\edgar_documents\ADBE\4_2024-07-17' --> 'data\processed_data\ADBE\4_2024-07-17.md'


2025-11-14 15:28:10,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,406 - INFO - Going to convert document batch...
2025-11-14 15:28:10,407 - INFO - Processing document 4_2024-07-26
2025-11-14 15:28:10,429 - INFO - Finished converting document 4_2024-07-26 in 0.06 sec.
2025-11-14 15:28:10,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,469 - INFO - Going to convert document batch...
2025-11-14 15:28:10,470 - INFO - Processing document 4_2024-08-12
2025-11-14 15:28:10,488 - INFO - Finished converting document 4_2024-08-12 in 0.03 sec.
2025-11-14 15:28:10,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,553 - INFO - Going to convert document batch...
2025-11-14 15:28:10,554 - INFO - Processing document 4_2024-08-19
2025-11-14 15:28:10,581 - INFO - Finished converting document 4_2024-08-19 in 0.08 sec.
2025-11-14 15:28:10,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2024-07-26' --> 'data\processed_data\ADBE\4_2024-07-26.md'
Converted 'data\edgar_documents\ADBE\4_2024-08-12' --> 'data\processed_data\ADBE\4_2024-08-12.md'
Converted 'data\edgar_documents\ADBE\4_2024-08-19' --> 'data\processed_data\ADBE\4_2024-08-19.md'


2025-11-14 15:28:10,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,687 - INFO - Going to convert document batch...
2025-11-14 15:28:10,688 - INFO - Processing document 4_2024-09-19
2025-11-14 15:28:10,709 - INFO - Finished converting document 4_2024-09-19 in 0.03 sec.
2025-11-14 15:28:10,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,773 - INFO - Going to convert document batch...
2025-11-14 15:28:10,774 - INFO - Processing document 4_2024-09-26
2025-11-14 15:28:10,801 - INFO - Finished converting document 4_2024-09-26 in 0.06 sec.
2025-11-14 15:28:10,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,850 - INFO - Going to convert document batch...
2025-11-14 15:28:10,851 - INFO - Processing document 4_2024-10-17


Converted 'data\edgar_documents\ADBE\4_2024-09-17' --> 'data\processed_data\ADBE\4_2024-09-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-09-19' --> 'data\processed_data\ADBE\4_2024-09-19.md'
Converted 'data\edgar_documents\ADBE\4_2024-09-26' --> 'data\processed_data\ADBE\4_2024-09-26.md'


2025-11-14 15:28:10,877 - INFO - Finished converting document 4_2024-10-17 in 0.05 sec.
2025-11-14 15:28:10,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,925 - INFO - Going to convert document batch...
2025-11-14 15:28:10,926 - INFO - Processing document 4_2024-10-28
2025-11-14 15:28:10,952 - INFO - Finished converting document 4_2024-10-28 in 0.05 sec.
2025-11-14 15:28:11,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,014 - INFO - Going to convert document batch...
2025-11-14 15:28:11,015 - INFO - Processing document 4_2024-10-31
2025-11-14 15:28:11,035 - INFO - Finished converting document 4_2024-10-31 in 0.06 sec.
2025-11-14 15:28:11,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,095 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ADBE\4_2024-10-17' --> 'data\processed_data\ADBE\4_2024-10-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-10-28' --> 'data\processed_data\ADBE\4_2024-10-28.md'
Converted 'data\edgar_documents\ADBE\4_2024-10-31' --> 'data\processed_data\ADBE\4_2024-10-31.md'


2025-11-14 15:28:11,095 - INFO - Processing document 4_2024-11-19
2025-11-14 15:28:11,117 - INFO - Finished converting document 4_2024-11-19 in 0.06 sec.
2025-11-14 15:28:11,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,155 - INFO - Going to convert document batch...
2025-11-14 15:28:11,156 - INFO - Processing document 4_2024-12-02
2025-11-14 15:28:11,174 - INFO - Finished converting document 4_2024-12-02 in 0.03 sec.
2025-11-14 15:28:11,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,251 - INFO - Going to convert document batch...
2025-11-14 15:28:11,252 - INFO - Processing document 4_2024-12-10
2025-11-14 15:28:11,273 - INFO - Finished converting document 4_2024-12-10 in 0.08 sec.
2025-11-14 15:28:11,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,316 - INFO - Going to convert document batch...
2025-11-14 15:28:11,317 - INFO - Processing document 4_2024-12-17


Converted 'data\edgar_documents\ADBE\4_2024-11-19' --> 'data\processed_data\ADBE\4_2024-11-19.md'
Converted 'data\edgar_documents\ADBE\4_2024-12-02' --> 'data\processed_data\ADBE\4_2024-12-02.md'
Converted 'data\edgar_documents\ADBE\4_2024-12-10' --> 'data\processed_data\ADBE\4_2024-12-10.md'


2025-11-14 15:28:11,350 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 15:28:11,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,397 - INFO - Going to convert document batch...
2025-11-14 15:28:11,398 - INFO - Processing document 4_2025-01-02
2025-11-14 15:28:11,415 - INFO - Finished converting document 4_2025-01-02 in 0.03 sec.
2025-11-14 15:28:11,452 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:11,453 - ERROR - Input document 4_2025-01-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\ADBE\4_2024-12-17' --> 'data\processed_data\ADBE\4_2024-12-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-01-02' --> 'data\processed_data\ADBE\4_2025-01-02.md'
Error processing data\edgar_documents\ADBE\4_2025-01-14: File format not allowed: data\edgar_documents\ADBE\4_2025-01-14
Error processing data\edgar_documents\ADBE\4_2025-01-15: File format not allowed: data\edgar_documents\ADBE\4_2025-01-15
Converted 'data\edgar_documents\ADBE\4_2025-01-17' --> 'data\processed_data\ADBE\4_2025-01-17.md'


2025-11-14 15:28:11,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,620 - INFO - Going to convert document batch...
2025-11-14 15:28:11,621 - INFO - Processing document 4_2025-01-28
2025-11-14 15:28:11,659 - INFO - Finished converting document 4_2025-01-28 in 0.11 sec.
2025-11-14 15:28:11,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,708 - INFO - Going to convert document batch...
2025-11-14 15:28:11,709 - INFO - Processing document 4_2025-01-30
2025-11-14 15:28:11,726 - INFO - Finished converting document 4_2025-01-30 in 0.03 sec.
2025-11-14 15:28:11,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,794 - INFO - Going to convert document batch...
2025-11-14 15:28:11,795 - INFO - Processing document 4_2025-03-17
2025-11-14 15:28:11,823 - INFO - Finished converting document 4_2025-03-17 in 0.08 sec.
2025-11-14 15:28:11,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2025-01-28' --> 'data\processed_data\ADBE\4_2025-01-28.md'
Converted 'data\edgar_documents\ADBE\4_2025-01-30' --> 'data\processed_data\ADBE\4_2025-01-30.md'
Converted 'data\edgar_documents\ADBE\4_2025-03-17' --> 'data\processed_data\ADBE\4_2025-03-17.md'


2025-11-14 15:28:11,886 - INFO - Going to convert document batch...
2025-11-14 15:28:11,886 - INFO - Processing document 4_2025-03-21
2025-11-14 15:28:11,906 - INFO - Finished converting document 4_2025-03-21 in 0.06 sec.
2025-11-14 15:28:11,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2025-03-21' --> 'data\processed_data\ADBE\4_2025-03-21.md'


2025-11-14 15:28:12,171 - INFO - Going to convert document batch...
2025-11-14 15:28:12,172 - INFO - Processing document 4_2025-04-17
2025-11-14 15:28:12,203 - INFO - Finished converting document 4_2025-04-17 in 0.28 sec.
2025-11-14 15:28:12,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,256 - INFO - Going to convert document batch...
2025-11-14 15:28:12,257 - INFO - Processing document 4_2025-04-23
2025-11-14 15:28:12,278 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 15:28:12,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,318 - INFO - Going to convert document batch...
2025-11-14 15:28:12,318 - INFO - Processing document 4_2025-04-28
2025-11-14 15:28:12,337 - INFO - Finished converting document 4_2025-04-28 in 0.03 sec.
2025-11-14 15:28:12,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,394 - INFO - Going to convert document batch...
2025-11-14 15:28:12,395 - 

Converted 'data\edgar_documents\ADBE\4_2025-04-17' --> 'data\processed_data\ADBE\4_2025-04-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-04-23' --> 'data\processed_data\ADBE\4_2025-04-23.md'
Converted 'data\edgar_documents\ADBE\4_2025-04-28' --> 'data\processed_data\ADBE\4_2025-04-28.md'


2025-11-14 15:28:12,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,454 - INFO - Going to convert document batch...
2025-11-14 15:28:12,455 - INFO - Processing document 4_2025-06-16
2025-11-14 15:28:12,475 - INFO - Finished converting document 4_2025-06-16 in 0.03 sec.
2025-11-14 15:28:12,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,520 - INFO - Going to convert document batch...
2025-11-14 15:28:12,521 - INFO - Processing document 4_2025-07-17
2025-11-14 15:28:12,551 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 15:28:12,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,598 - INFO - Going to convert document batch...
2025-11-14 15:28:12,599 - INFO - Processing document 4_2025-07-28
2025-11-14 15:28:12,622 - INFO - Finished converting document 4_2025-07-28 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2025-05-06' --> 'data\processed_data\ADBE\4_2025-05-06.md'
Converted 'data\edgar_documents\ADBE\4_2025-06-16' --> 'data\processed_data\ADBE\4_2025-06-16.md'
Converted 'data\edgar_documents\ADBE\4_2025-07-17' --> 'data\processed_data\ADBE\4_2025-07-17.md'


2025-11-14 15:28:12,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,669 - INFO - Going to convert document batch...
2025-11-14 15:28:12,670 - INFO - Processing document 4_2025-09-17
2025-11-14 15:28:12,700 - INFO - Finished converting document 4_2025-09-17 in 0.06 sec.
2025-11-14 15:28:12,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,768 - INFO - Going to convert document batch...
2025-11-14 15:28:12,769 - INFO - Processing document 4_2025-10-16
2025-11-14 15:28:12,798 - INFO - Finished converting document 4_2025-10-16 in 0.08 sec.


Converted 'data\edgar_documents\ADBE\4_2025-07-28' --> 'data\processed_data\ADBE\4_2025-07-28.md'
Converted 'data\edgar_documents\ADBE\4_2025-09-17' --> 'data\processed_data\ADBE\4_2025-09-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-10-16' --> 'data\processed_data\ADBE\4_2025-10-16.md'


2025-11-14 15:28:12,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,863 - INFO - Going to convert document batch...
2025-11-14 15:28:12,864 - INFO - Processing document 4_2025-10-27
2025-11-14 15:28:12,885 - INFO - Finished converting document 4_2025-10-27 in 0.06 sec.
2025-11-14 15:28:12,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,931 - INFO - Going to convert document batch...
2025-11-14 15:28:12,931 - INFO - Processing document 4_2025-11-04
2025-11-14 15:28:12,948 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 15:28:12,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,988 - INFO - Going to convert document batch...
2025-11-14 15:28:12,989 - INFO - Processing document 8-K_2023-01-19
2025-11-14 15:28:13,005 - INFO - Finished converting document 8-K_2023-01-19 in 0.03 sec.
2025-11-14 15:28:13,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14

Converted 'data\edgar_documents\ADBE\4_2025-10-27' --> 'data\processed_data\ADBE\4_2025-10-27.md'
Converted 'data\edgar_documents\ADBE\4_2025-11-04' --> 'data\processed_data\ADBE\4_2025-11-04.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-01-19' --> 'data\processed_data\ADBE\8-K_2023-01-19.md'


2025-11-14 15:28:13,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,181 - INFO - Going to convert document batch...
2025-11-14 15:28:13,182 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:28:13,200 - INFO - Finished converting document 8-K_2023-03-15 in 0.06 sec.
2025-11-14 15:28:13,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,279 - INFO - Going to convert document batch...
2025-11-14 15:28:13,279 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:28:13,322 - INFO - Finished converting document 8-K_2023-04-24 in 0.11 sec.
2025-11-14 15:28:13,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\8-K_2023-01-26' --> 'data\processed_data\ADBE\8-K_2023-01-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-03-15' --> 'data\processed_data\ADBE\8-K_2023-03-15.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-04-24' --> 'data\processed_data\ADBE\8-K_2023-04-24.md'


2025-11-14 15:28:13,369 - INFO - Going to convert document batch...
2025-11-14 15:28:13,370 - INFO - Processing document 8-K_2023-06-15
2025-11-14 15:28:13,387 - INFO - Finished converting document 8-K_2023-06-15 in 0.05 sec.
2025-11-14 15:28:13,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,420 - INFO - Going to convert document batch...
2025-11-14 15:28:13,421 - INFO - Processing document 8-K_2023-09-14
2025-11-14 15:28:13,440 - INFO - Finished converting document 8-K_2023-09-14 in 0.05 sec.
2025-11-14 15:28:13,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,491 - INFO - Going to convert document batch...
2025-11-14 15:28:13,492 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:28:13,514 - INFO - Finished converting document 8-K_2023-10-26 in 0.06 sec.
2025-11-14 15:28:13,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,551 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2023-06-15' --> 'data\processed_data\ADBE\8-K_2023-06-15.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-09-14' --> 'data\processed_data\ADBE\8-K_2023-09-14.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-10-26' --> 'data\processed_data\ADBE\8-K_2023-10-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-12-13' --> 'data\processed_data\ADBE\8-K_2023-12-13.md'


2025-11-14 15:28:13,603 - INFO - Going to convert document batch...
2025-11-14 15:28:13,603 - INFO - Processing document 8-K_2023-12-18
2025-11-14 15:28:13,624 - INFO - Finished converting document 8-K_2023-12-18 in 0.05 sec.
2025-11-14 15:28:13,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,699 - INFO - Going to convert document batch...
2025-11-14 15:28:13,700 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:28:13,739 - INFO - Finished converting document 8-K_2024-01-26 in 0.09 sec.
2025-11-14 15:28:13,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,782 - INFO - Going to convert document batch...
2025-11-14 15:28:13,783 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:28:13,801 - INFO - Finished converting document 8-K_2024-03-14 in 0.03 sec.
2025-11-14 15:28:13,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,833 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ADBE\8-K_2023-12-18' --> 'data\processed_data\ADBE\8-K_2023-12-18.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-01-26' --> 'data\processed_data\ADBE\8-K_2024-01-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-03-14' --> 'data\processed_data\ADBE\8-K_2024-03-14.md'


2025-11-14 15:28:13,834 - INFO - Processing document 8-K_2024-04-04
2025-11-14 15:28:13,857 - INFO - Finished converting document 8-K_2024-04-04 in 0.05 sec.
2025-11-14 15:28:13,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,904 - INFO - Going to convert document batch...
2025-11-14 15:28:13,905 - INFO - Processing document 8-K_2024-04-19
2025-11-14 15:28:13,947 - INFO - Finished converting document 8-K_2024-04-19 in 0.06 sec.
2025-11-14 15:28:13,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,993 - INFO - Going to convert document batch...
2025-11-14 15:28:13,994 - INFO - Processing document 8-K_2024-06-13
2025-11-14 15:28:14,011 - INFO - Finished converting document 8-K_2024-06-13 in 0.05 sec.
2025-11-14 15:28:14,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,038 - INFO - Going to convert document batch...
2025-11-14 15:28:14,039 - INFO - Processing document 8-K_2024-07-18
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2024-04-04' --> 'data\processed_data\ADBE\8-K_2024-04-04.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-04-19' --> 'data\processed_data\ADBE\8-K_2024-04-19.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-06-13' --> 'data\processed_data\ADBE\8-K_2024-06-13.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-07-18' --> 'data\processed_data\ADBE\8-K_2024-07-18.md'


2025-11-14 15:28:14,073 - INFO - Going to convert document batch...
2025-11-14 15:28:14,074 - INFO - Processing document 8-K_2024-08-08
2025-11-14 15:28:14,087 - INFO - Finished converting document 8-K_2024-08-08 in 0.02 sec.
2025-11-14 15:28:14,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,125 - INFO - Going to convert document batch...
2025-11-14 15:28:14,126 - INFO - Processing document 8-K_2024-09-12
2025-11-14 15:28:14,141 - INFO - Finished converting document 8-K_2024-09-12 in 0.05 sec.
2025-11-14 15:28:14,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,172 - INFO - Going to convert document batch...
2025-11-14 15:28:14,173 - INFO - Processing document 8-K_2024-12-11
2025-11-14 15:28:14,189 - INFO - Finished converting document 8-K_2024-12-11 in 0.05 sec.
2025-11-14 15:28:14,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,224 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2024-08-08' --> 'data\processed_data\ADBE\8-K_2024-08-08.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-09-12' --> 'data\processed_data\ADBE\8-K_2024-09-12.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-12-11' --> 'data\processed_data\ADBE\8-K_2024-12-11.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-01-17' --> 'data\processed_data\ADBE\8-K_2025-01-17.md'


2025-11-14 15:28:14,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,317 - INFO - Going to convert document batch...
2025-11-14 15:28:14,318 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:28:14,353 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.
2025-11-14 15:28:14,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,423 - INFO - Going to convert document batch...
2025-11-14 15:28:14,424 - INFO - Processing document 8-K_2025-03-12
2025-11-14 15:28:14,439 - INFO - Finished converting document 8-K_2025-03-12 in 0.06 sec.
2025-11-14 15:28:14,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,504 - INFO - Going to convert document batch...
2025-11-14 15:28:14,506 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:28:14,548 - INFO - Finished converting document 8-K_2025-04-24 in 0.09 sec.


Converted 'data\edgar_documents\ADBE\8-K_2025-01-30' --> 'data\processed_data\ADBE\8-K_2025-01-30.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-03-12' --> 'data\processed_data\ADBE\8-K_2025-03-12.md'


2025-11-14 15:28:14,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,622 - INFO - Going to convert document batch...
2025-11-14 15:28:14,622 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:28:14,642 - INFO - Finished converting document 8-K_2025-06-12 in 0.08 sec.
2025-11-14 15:28:14,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,671 - INFO - Going to convert document batch...
2025-11-14 15:28:14,672 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:28:14,688 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:28:14,728 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:14,730 - ERROR - Input document DEF-14A_2023-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF

Converted 'data\edgar_documents\ADBE\8-K_2025-04-24' --> 'data\processed_data\ADBE\8-K_2025-04-24.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-06-12' --> 'data\processed_data\ADBE\8-K_2025-06-12.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-09-11' --> 'data\processed_data\ADBE\8-K_2025-09-11.md'
Error processing data\edgar_documents\ADBE\DEF-14A_2023-03-03: File format not allowed: data\edgar_documents\ADBE\DEF-14A_2023-03-03


2025-11-14 15:28:15,359 - INFO - Going to convert document batch...
2025-11-14 15:28:15,360 - INFO - Processing document DEF-14A_2024-03-01
2025-11-14 15:28:16,656 - INFO - Finished converting document DEF-14A_2024-03-01 in 1.92 sec.
2025-11-14 15:28:17,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\DEF-14A_2024-03-01' --> 'data\processed_data\ADBE\DEF-14A_2024-03-01.md'


2025-11-14 15:28:18,158 - INFO - Going to convert document batch...
2025-11-14 15:28:18,158 - INFO - Processing document DEF-14A_2025-02-28
2025-11-14 15:28:19,622 - INFO - Finished converting document DEF-14A_2025-02-28 in 2.16 sec.


Converted 'data\edgar_documents\ADBE\DEF-14A_2025-02-28' --> 'data\processed_data\ADBE\DEF-14A_2025-02-28.md'
Processed 121 new files. Errors: 6
Found 164 files to process in data\edgar_documents\AIG


2025-11-14 15:28:20,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:25,018 - INFO - Going to convert document batch...
2025-11-14 15:28:25,019 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:28:25,020 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:28:43,429 - INFO - Finished converting document 10-K_2023-02-17 in 22.84 sec.


Converted 'data\edgar_documents\AIG\10-K_2023-02-17' --> 'data\processed_data\AIG\10-K_2023-02-17.md'


2025-11-14 15:28:47,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:52,206 - INFO - Going to convert document batch...
2025-11-14 15:28:52,207 - INFO - Processing document 10-K_2024-02-14
2025-11-14 15:29:15,849 - INFO - Finished converting document 10-K_2024-02-14 in 29.14 sec.


Converted 'data\edgar_documents\AIG\10-K_2024-02-14' --> 'data\processed_data\AIG\10-K_2024-02-14.md'


2025-11-14 15:29:20,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:29:24,547 - INFO - Going to convert document batch...
2025-11-14 15:29:24,548 - INFO - Processing document 10-K_2025-02-13
2025-11-14 15:29:38,823 - INFO - Finished converting document 10-K_2025-02-13 in 19.08 sec.


Converted 'data\edgar_documents\AIG\10-K_2025-02-13' --> 'data\processed_data\AIG\10-K_2025-02-13.md'


2025-11-14 15:29:42,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:29:45,910 - INFO - Going to convert document batch...
2025-11-14 15:29:45,911 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:29:53,882 - INFO - Finished converting document 10-Q_2023-05-05 in 11.97 sec.


Converted 'data\edgar_documents\AIG\10-Q_2023-05-05' --> 'data\processed_data\AIG\10-Q_2023-05-05.md'


2025-11-14 15:29:57,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:30:09,326 - INFO - Going to convert document batch...
2025-11-14 15:30:09,327 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:30:31,894 - INFO - Finished converting document 10-Q_2023-08-02 in 34.20 sec.


Converted 'data\edgar_documents\AIG\10-Q_2023-08-02' --> 'data\processed_data\AIG\10-Q_2023-08-02.md'


2025-11-14 15:30:36,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:30:39,624 - INFO - Going to convert document batch...
2025-11-14 15:30:39,625 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 15:30:49,531 - INFO - Finished converting document 10-Q_2023-11-02 in 13.62 sec.
2025-11-14 15:30:52,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2023-11-02' --> 'data\processed_data\AIG\10-Q_2023-11-02.md'


2025-11-14 15:30:55,901 - INFO - Going to convert document batch...
2025-11-14 15:30:55,902 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:31:01,337 - INFO - Finished converting document 10-Q_2024-05-02 in 9.05 sec.
2025-11-14 15:31:03,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-05-02' --> 'data\processed_data\AIG\10-Q_2024-05-02.md'


2025-11-14 15:31:06,700 - INFO - Going to convert document batch...
2025-11-14 15:31:06,700 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 15:31:12,993 - INFO - Finished converting document 10-Q_2024-08-01 in 9.61 sec.
2025-11-14 15:31:15,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-08-01' --> 'data\processed_data\AIG\10-Q_2024-08-01.md'


2025-11-14 15:31:18,053 - INFO - Going to convert document batch...
2025-11-14 15:31:18,054 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 15:31:23,308 - INFO - Finished converting document 10-Q_2024-11-07 in 8.27 sec.
2025-11-14 15:31:25,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-11-07' --> 'data\processed_data\AIG\10-Q_2024-11-07.md'


2025-11-14 15:31:27,665 - INFO - Going to convert document batch...
2025-11-14 15:31:27,666 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:31:31,646 - INFO - Finished converting document 10-Q_2025-05-02 in 6.44 sec.
2025-11-14 15:31:33,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2025-05-02' --> 'data\processed_data\AIG\10-Q_2025-05-02.md'


2025-11-14 15:31:36,023 - INFO - Going to convert document batch...
2025-11-14 15:31:36,025 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 15:31:41,229 - INFO - Finished converting document 10-Q_2025-08-07 in 8.12 sec.
2025-11-14 15:31:43,478 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:43,479 - ERROR - Input document 10-Q_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:31:43,484 - INFO - Going to convert d

Converted 'data\edgar_documents\AIG\10-Q_2025-08-07' --> 'data\processed_data\AIG\10-Q_2025-08-07.md'
Error processing data\edgar_documents\AIG\10-Q_2025-11-05: File format not allowed: data\edgar_documents\AIG\10-Q_2025-11-05


2025-11-14 15:31:43,534 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 15:31:43,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,613 - INFO - Going to convert document batch...
2025-11-14 15:31:43,614 - INFO - Processing document 4_2023-01-05
2025-11-14 15:31:43,641 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 15:31:43,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,693 - INFO - Going to convert document batch...
2025-11-14 15:31:43,694 - INFO - Processing document 4_2023-01-18
2025-11-14 15:31:43,717 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:31:43,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-01-03' --> 'data\processed_data\AIG\4_2023-01-03.md'
Converted 'data\edgar_documents\AIG\4_2023-01-05' --> 'data\processed_data\AIG\4_2023-01-05.md'
Converted 'data\edgar_documents\AIG\4_2023-01-18' --> 'data\processed_data\AIG\4_2023-01-18.md'


2025-11-14 15:31:43,797 - INFO - Going to convert document batch...
2025-11-14 15:31:43,797 - INFO - Processing document 4_2023-02-14
2025-11-14 15:31:43,830 - INFO - Finished converting document 4_2023-02-14 in 0.09 sec.
2025-11-14 15:31:43,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,884 - INFO - Going to convert document batch...
2025-11-14 15:31:43,886 - INFO - Processing document 4_2023-02-16
2025-11-14 15:31:43,911 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 15:31:43,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,967 - INFO - Going to convert document batch...
2025-11-14 15:31:43,967 - INFO - Processing document 4_2023-02-23
2025-11-14 15:31:43,990 - INFO - Finished converting document 4_2023-02-23 in 0.05 sec.
2025-11-14 15:31:44,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,032 - INFO - Going to convert document batch...
2025-11-14 15:31:44,033 - 

Converted 'data\edgar_documents\AIG\4_2023-02-14' --> 'data\processed_data\AIG\4_2023-02-14.md'
Converted 'data\edgar_documents\AIG\4_2023-02-16' --> 'data\processed_data\AIG\4_2023-02-16.md'
Converted 'data\edgar_documents\AIG\4_2023-02-23' --> 'data\processed_data\AIG\4_2023-02-23.md'


2025-11-14 15:31:44,054 - INFO - Finished converting document 4_2023-03-02 in 0.03 sec.
2025-11-14 15:31:44,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,109 - INFO - Going to convert document batch...
2025-11-14 15:31:44,110 - INFO - Processing document 4_2023-03-17
2025-11-14 15:31:44,133 - INFO - Finished converting document 4_2023-03-17 in 0.05 sec.
2025-11-14 15:31:44,209 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:44,209 - ERROR - Input document 4_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\AIG\4_2023-03-02' --> 'data\processed_data\AIG\4_2023-03-02.md'
Converted 'data\edgar_documents\AIG\4_2023-03-17' --> 'data\processed_data\AIG\4_2023-03-17.md'
Error processing data\edgar_documents\AIG\4_2023-03-23: File format not allowed: data\edgar_documents\AIG\4_2023-03-23
Error processing data\edgar_documents\AIG\4_2023-03-24: File format not allowed: data\edgar_documents\AIG\4_2023-03-24


2025-11-14 15:31:44,267 - INFO - Processing document 4_2023-04-04
2025-11-14 15:31:44,295 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 15:31:44,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,364 - INFO - Going to convert document batch...
2025-11-14 15:31:44,365 - INFO - Processing document 4_2023-04-05
2025-11-14 15:31:44,390 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 15:31:44,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,451 - INFO - Going to convert document batch...
2025-11-14 15:31:44,452 - INFO - Processing document 4_2023-04-18
2025-11-14 15:31:44,474 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2023-04-04' --> 'data\processed_data\AIG\4_2023-04-04.md'
Converted 'data\edgar_documents\AIG\4_2023-04-05' --> 'data\processed_data\AIG\4_2023-04-05.md'
Converted 'data\edgar_documents\AIG\4_2023-04-18' --> 'data\processed_data\AIG\4_2023-04-18.md'


2025-11-14 15:31:44,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,560 - INFO - Going to convert document batch...
2025-11-14 15:31:44,561 - INFO - Processing document 4_2023-05-12
2025-11-14 15:31:44,587 - INFO - Finished converting document 4_2023-05-12 in 0.08 sec.
2025-11-14 15:31:44,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,653 - INFO - Going to convert document batch...
2025-11-14 15:31:44,654 - INFO - Processing document 4_2023-06-12
2025-11-14 15:31:44,674 - INFO - Finished converting document 4_2023-06-12 in 0.06 sec.
2025-11-14 15:31:44,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,739 - INFO - Going to convert document batch...
2025-11-14 15:31:44,740 - INFO - Processing document 4_2023-06-16
2025-11-14 15:31:44,775 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2023-05-12' --> 'data\processed_data\AIG\4_2023-05-12.md'
Converted 'data\edgar_documents\AIG\4_2023-06-12' --> 'data\processed_data\AIG\4_2023-06-12.md'


2025-11-14 15:31:44,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,845 - INFO - Going to convert document batch...
2025-11-14 15:31:44,846 - INFO - Processing document 4_2023-06-21
2025-11-14 15:31:44,869 - INFO - Finished converting document 4_2023-06-21 in 0.05 sec.
2025-11-14 15:31:44,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,945 - INFO - Going to convert document batch...
2025-11-14 15:31:44,945 - INFO - Processing document 4_2023-06-23
2025-11-14 15:31:44,965 - INFO - Finished converting document 4_2023-06-23 in 0.08 sec.
2025-11-14 15:31:45,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-06-16' --> 'data\processed_data\AIG\4_2023-06-16.md'
Converted 'data\edgar_documents\AIG\4_2023-06-21' --> 'data\processed_data\AIG\4_2023-06-21.md'
Converted 'data\edgar_documents\AIG\4_2023-06-23' --> 'data\processed_data\AIG\4_2023-06-23.md'


2025-11-14 15:31:45,025 - INFO - Going to convert document batch...
2025-11-14 15:31:45,026 - INFO - Processing document 4_2023-07-05
2025-11-14 15:31:45,051 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:31:45,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,112 - INFO - Going to convert document batch...
2025-11-14 15:31:45,112 - INFO - Processing document 4_2023-07-06
2025-11-14 15:31:45,136 - INFO - Finished converting document 4_2023-07-06 in 0.06 sec.
2025-11-14 15:31:45,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,216 - INFO - Going to convert document batch...
2025-11-14 15:31:45,217 - INFO - Processing document 4_2023-07-26


Converted 'data\edgar_documents\AIG\4_2023-07-05' --> 'data\processed_data\AIG\4_2023-07-05.md'
Converted 'data\edgar_documents\AIG\4_2023-07-06' --> 'data\processed_data\AIG\4_2023-07-06.md'


2025-11-14 15:31:45,296 - INFO - Finished converting document 4_2023-07-26 in 0.12 sec.
2025-11-14 15:31:45,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,400 - INFO - Going to convert document batch...
2025-11-14 15:31:45,401 - INFO - Processing document 4_2023-08-07
2025-11-14 15:31:45,440 - INFO - Finished converting document 4_2023-08-07 in 0.08 sec.
2025-11-14 15:31:45,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,504 - INFO - Going to convert document batch...
2025-11-14 15:31:45,505 - INFO - Processing document 4_2023-08-11
2025-11-14 15:31:45,524 - INFO - Finished converting document 4_2023-08-11 in 0.05 sec.
2025-11-14 15:31:45,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-07-26' --> 'data\processed_data\AIG\4_2023-07-26.md'
Converted 'data\edgar_documents\AIG\4_2023-08-07' --> 'data\processed_data\AIG\4_2023-08-07.md'
Converted 'data\edgar_documents\AIG\4_2023-08-11' --> 'data\processed_data\AIG\4_2023-08-11.md'


2025-11-14 15:31:45,580 - INFO - Going to convert document batch...
2025-11-14 15:31:45,581 - INFO - Processing document 4_2023-10-03
2025-11-14 15:31:45,605 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 15:31:45,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,670 - INFO - Going to convert document batch...
2025-11-14 15:31:45,670 - INFO - Processing document 4_2023-10-17
2025-11-14 15:31:45,706 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.
2025-11-14 15:31:45,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,776 - INFO - Going to convert document batch...
2025-11-14 15:31:45,776 - INFO - Processing document 4_2023-10-18
2025-11-14 15:31:45,807 - INFO - Finished converting document 4_2023-10-18 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2023-10-03' --> 'data\processed_data\AIG\4_2023-10-03.md'
Converted 'data\edgar_documents\AIG\4_2023-10-17' --> 'data\processed_data\AIG\4_2023-10-17.md'


2025-11-14 15:31:45,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,859 - INFO - Going to convert document batch...
2025-11-14 15:31:45,860 - INFO - Processing document 4_2023-11-13
2025-11-14 15:31:45,883 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:31:45,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,933 - INFO - Going to convert document batch...
2025-11-14 15:31:45,934 - INFO - Processing document 4_2023-12-05
2025-11-14 15:31:45,961 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 15:31:46,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,018 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\4_2023-10-18' --> 'data\processed_data\AIG\4_2023-10-18.md'
Converted 'data\edgar_documents\AIG\4_2023-11-13' --> 'data\processed_data\AIG\4_2023-11-13.md'
Converted 'data\edgar_documents\AIG\4_2023-12-05' --> 'data\processed_data\AIG\4_2023-12-05.md'


2025-11-14 15:31:46,019 - INFO - Processing document 4_2023-12-12
2025-11-14 15:31:46,048 - INFO - Finished converting document 4_2023-12-12 in 0.06 sec.
2025-11-14 15:31:46,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,101 - INFO - Going to convert document batch...
2025-11-14 15:31:46,101 - INFO - Processing document 4_2023-12-18
2025-11-14 15:31:46,131 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 15:31:46,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-12-12' --> 'data\processed_data\AIG\4_2023-12-12.md'
Converted 'data\edgar_documents\AIG\4_2023-12-18' --> 'data\processed_data\AIG\4_2023-12-18.md'


2025-11-14 15:31:46,902 - INFO - Going to convert document batch...
2025-11-14 15:31:46,904 - INFO - Processing document 4_2023-12-19
2025-11-14 15:31:46,927 - INFO - Finished converting document 4_2023-12-19 in 0.77 sec.
2025-11-14 15:31:46,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,980 - INFO - Going to convert document batch...
2025-11-14 15:31:46,981 - INFO - Processing document 4_2023-12-21
2025-11-14 15:31:47,022 - INFO - Finished converting document 4_2023-12-21 in 0.06 sec.
2025-11-14 15:31:47,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,081 - INFO - Going to convert document batch...
2025-11-14 15:31:47,082 - INFO - Processing document 4_2024-01-02
2025-11-14 15:31:47,111 - INFO - Finished converting document 4_2024-01-02 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2023-12-19' --> 'data\processed_data\AIG\4_2023-12-19.md'
Converted 'data\edgar_documents\AIG\4_2023-12-21' --> 'data\processed_data\AIG\4_2023-12-21.md'
Converted 'data\edgar_documents\AIG\4_2024-01-02' --> 'data\processed_data\AIG\4_2024-01-02.md'


2025-11-14 15:31:47,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,163 - INFO - Going to convert document batch...
2025-11-14 15:31:47,164 - INFO - Processing document 4_2024-01-03
2025-11-14 15:31:47,190 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:31:47,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,238 - INFO - Going to convert document batch...
2025-11-14 15:31:47,239 - INFO - Processing document 4_2024-01-04
2025-11-14 15:31:47,263 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 15:31:47,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,326 - INFO - Going to convert document batch...
2025-11-14 15:31:47,327 - INFO - Processing document 4_2024-01-17
2025-11-14 15:31:47,348 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 15:31:47,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2024-01-03' --> 'data\processed_data\AIG\4_2024-01-03.md'
Converted 'data\edgar_documents\AIG\4_2024-01-04' --> 'data\processed_data\AIG\4_2024-01-04.md'
Converted 'data\edgar_documents\AIG\4_2024-01-17' --> 'data\processed_data\AIG\4_2024-01-17.md'


2025-11-14 15:31:47,419 - INFO - Processing document 4_2024-02-08
2025-11-14 15:31:47,469 - INFO - Finished converting document 4_2024-02-08 in 0.09 sec.
2025-11-14 15:31:47,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,534 - INFO - Going to convert document batch...
2025-11-14 15:31:47,535 - INFO - Processing document 4_2024-02-22
2025-11-14 15:31:47,562 - INFO - Finished converting document 4_2024-02-22 in 0.06 sec.
2025-11-14 15:31:47,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,607 - INFO - Going to convert document batch...
2025-11-14 15:31:47,607 - INFO - Processing document 4_2024-02-27
2025-11-14 15:31:47,626 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:31:47,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,666 - INFO - Going to convert document batch...
2025-11-14 15:31:47,667 - INFO - Processing document 4_2024-02-29
2025-11-14 15:31:47,686 - IN

Converted 'data\edgar_documents\AIG\4_2024-02-08' --> 'data\processed_data\AIG\4_2024-02-08.md'
Converted 'data\edgar_documents\AIG\4_2024-02-22' --> 'data\processed_data\AIG\4_2024-02-22.md'
Converted 'data\edgar_documents\AIG\4_2024-02-27' --> 'data\processed_data\AIG\4_2024-02-27.md'


2025-11-14 15:31:47,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,741 - INFO - Going to convert document batch...
2025-11-14 15:31:47,742 - INFO - Processing document 4_2024-03-05
2025-11-14 15:31:47,773 - INFO - Finished converting document 4_2024-03-05 in 0.06 sec.
2025-11-14 15:31:47,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,818 - INFO - Going to convert document batch...
2025-11-14 15:31:47,819 - INFO - Processing document 4_2024-03-18
2025-11-14 15:31:47,840 - INFO - Finished converting document 4_2024-03-18 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2024-02-29' --> 'data\processed_data\AIG\4_2024-02-29.md'
Converted 'data\edgar_documents\AIG\4_2024-03-05' --> 'data\processed_data\AIG\4_2024-03-05.md'
Converted 'data\edgar_documents\AIG\4_2024-03-18' --> 'data\processed_data\AIG\4_2024-03-18.md'


2025-11-14 15:31:47,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,923 - INFO - Going to convert document batch...
2025-11-14 15:31:47,924 - INFO - Processing document 4_2024-03-29
2025-11-14 15:31:47,945 - INFO - Finished converting document 4_2024-03-29 in 0.08 sec.
2025-11-14 15:31:47,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,009 - INFO - Going to convert document batch...
2025-11-14 15:31:48,010 - INFO - Processing document 4_2024-04-03
2025-11-14 15:31:48,030 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:31:48,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,072 - INFO - Going to convert document batch...
2025-11-14 15:31:48,073 - INFO - Processing document 4_2024-05-17
2025-11-14 15:31:48,092 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 15:31:48,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2024-03-29' --> 'data\processed_data\AIG\4_2024-03-29.md'
Converted 'data\edgar_documents\AIG\4_2024-04-03' --> 'data\processed_data\AIG\4_2024-04-03.md'
Converted 'data\edgar_documents\AIG\4_2024-05-17' --> 'data\processed_data\AIG\4_2024-05-17.md'


2025-11-14 15:31:48,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,226 - INFO - Going to convert document batch...
2025-11-14 15:31:48,227 - INFO - Processing document 4_2024-06-11
2025-11-14 15:31:48,255 - INFO - Finished converting document 4_2024-06-11 in 0.08 sec.
2025-11-14 15:31:48,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,299 - INFO - Going to convert document batch...
2025-11-14 15:31:48,300 - INFO - Processing document 4_2024-06-14
2025-11-14 15:31:48,322 - INFO - Finished converting document 4_2024-06-14 in 0.03 sec.
2025-11-14 15:31:48,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2024-06-03' --> 'data\processed_data\AIG\4_2024-06-03.md'
Converted 'data\edgar_documents\AIG\4_2024-06-11' --> 'data\processed_data\AIG\4_2024-06-11.md'
Converted 'data\edgar_documents\AIG\4_2024-06-14' --> 'data\processed_data\AIG\4_2024-06-14.md'


2025-11-14 15:31:48,363 - INFO - Going to convert document batch...
2025-11-14 15:31:48,364 - INFO - Processing document 4_2024-06-18
2025-11-14 15:31:48,385 - INFO - Finished converting document 4_2024-06-18 in 0.03 sec.
2025-11-14 15:31:48,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,432 - INFO - Going to convert document batch...
2025-11-14 15:31:48,433 - INFO - Processing document 4_2024-06-21
2025-11-14 15:31:48,455 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.
2025-11-14 15:31:48,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,506 - INFO - Going to convert document batch...
2025-11-14 15:31:48,507 - INFO - Processing document 4_2024-07-01
2025-11-14 15:31:48,528 - INFO - Finished converting document 4_2024-07-01 in 0.06 sec.
2025-11-14 15:31:48,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,583 - INFO - Going to convert document batch...
2025-11-14 15:31:48,584 - 

Converted 'data\edgar_documents\AIG\4_2024-06-18' --> 'data\processed_data\AIG\4_2024-06-18.md'
Converted 'data\edgar_documents\AIG\4_2024-06-21' --> 'data\processed_data\AIG\4_2024-06-21.md'
Converted 'data\edgar_documents\AIG\4_2024-07-01' --> 'data\processed_data\AIG\4_2024-07-01.md'


2025-11-14 15:31:48,606 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 15:31:48,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,656 - INFO - Going to convert document batch...
2025-11-14 15:31:48,657 - INFO - Processing document 4_2024-07-30
2025-11-14 15:31:48,681 - INFO - Finished converting document 4_2024-07-30 in 0.05 sec.
2025-11-14 15:31:48,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,726 - INFO - Going to convert document batch...
2025-11-14 15:31:48,727 - INFO - Processing document 4_2024-08-07
2025-11-14 15:31:48,748 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.
2025-11-14 15:31:48,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,802 - INFO - Going to convert document batch...
2025-11-14 15:31:48,802 - INFO - Processing document 4_2024-08-19


Converted 'data\edgar_documents\AIG\4_2024-07-02' --> 'data\processed_data\AIG\4_2024-07-02.md'
Converted 'data\edgar_documents\AIG\4_2024-07-30' --> 'data\processed_data\AIG\4_2024-07-30.md'
Converted 'data\edgar_documents\AIG\4_2024-08-07' --> 'data\processed_data\AIG\4_2024-08-07.md'


2025-11-14 15:31:48,824 - INFO - Finished converting document 4_2024-08-19 in 0.06 sec.
2025-11-14 15:31:48,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,874 - INFO - Going to convert document batch...
2025-11-14 15:31:48,874 - INFO - Processing document 4_2024-09-18
2025-11-14 15:31:48,894 - INFO - Finished converting document 4_2024-09-18 in 0.03 sec.
2025-11-14 15:31:48,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,934 - INFO - Going to convert document batch...
2025-11-14 15:31:48,936 - INFO - Processing document 4_2024-10-02
2025-11-14 15:31:48,957 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 15:31:48,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,000 - INFO - Going to convert document batch...
2025-11-14 15:31:49,001 - INFO - Processing document 4_2024-10-18
2025-11-14 15:31:49,023 - INFO - Finished converting document 4_2024-10-18 in 0.03 sec.


Converted 'data\edgar_documents\AIG\4_2024-08-19' --> 'data\processed_data\AIG\4_2024-08-19.md'
Converted 'data\edgar_documents\AIG\4_2024-09-18' --> 'data\processed_data\AIG\4_2024-09-18.md'
Converted 'data\edgar_documents\AIG\4_2024-10-02' --> 'data\processed_data\AIG\4_2024-10-02.md'


2025-11-14 15:31:49,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,067 - INFO - Going to convert document batch...
2025-11-14 15:31:49,067 - INFO - Processing document 4_2024-11-07
2025-11-14 15:31:49,086 - INFO - Finished converting document 4_2024-11-07 in 0.03 sec.
2025-11-14 15:31:49,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,128 - INFO - Going to convert document batch...
2025-11-14 15:31:49,128 - INFO - Processing document 4_2024-11-12
2025-11-14 15:31:49,146 - INFO - Finished converting document 4_2024-11-12 in 0.03 sec.
2025-11-14 15:31:49,187 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:49,187 - ERROR - Input document 4_2024-11-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\AIG\4_2024-10-18' --> 'data\processed_data\AIG\4_2024-10-18.md'
Converted 'data\edgar_documents\AIG\4_2024-11-07' --> 'data\processed_data\AIG\4_2024-11-07.md'
Converted 'data\edgar_documents\AIG\4_2024-11-12' --> 'data\processed_data\AIG\4_2024-11-12.md'
Error processing data\edgar_documents\AIG\4_2024-11-14: File format not allowed: data\edgar_documents\AIG\4_2024-11-14
Error processing data\edgar_documents\AIG\4_2024-11-20: File format not allowed: data\edgar_documents\AIG\4_2024-11-20


2025-11-14 15:31:49,233 - INFO - Processing document 4_2024-11-26
2025-11-14 15:31:49,250 - INFO - Finished converting document 4_2024-11-26 in 0.03 sec.
2025-11-14 15:31:49,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,308 - INFO - Going to convert document batch...
2025-11-14 15:31:49,308 - INFO - Processing document 4_2024-12-03
2025-11-14 15:31:49,328 - INFO - Finished converting document 4_2024-12-03 in 0.06 sec.
2025-11-14 15:31:49,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,386 - INFO - Going to convert document batch...
2025-11-14 15:31:49,386 - INFO - Processing document 4_2024-12-10
2025-11-14 15:31:49,405 - INFO - Finished converting document 4_2024-12-10 in 0.06 sec.
2025-11-14 15:31:49,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2024-11-26' --> 'data\processed_data\AIG\4_2024-11-26.md'
Converted 'data\edgar_documents\AIG\4_2024-12-03' --> 'data\processed_data\AIG\4_2024-12-03.md'
Converted 'data\edgar_documents\AIG\4_2024-12-10' --> 'data\processed_data\AIG\4_2024-12-10.md'


2025-11-14 15:31:49,456 - INFO - Going to convert document batch...
2025-11-14 15:31:49,457 - INFO - Processing document 4_2024-12-11
2025-11-14 15:31:49,478 - INFO - Finished converting document 4_2024-12-11 in 0.03 sec.
2025-11-14 15:31:49,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,532 - INFO - Going to convert document batch...
2025-11-14 15:31:49,533 - INFO - Processing document 4_2024-12-17
2025-11-14 15:31:49,563 - INFO - Finished converting document 4_2024-12-17 in 0.06 sec.
2025-11-14 15:31:49,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,610 - INFO - Going to convert document batch...
2025-11-14 15:31:49,610 - INFO - Processing document 4_2025-01-02
2025-11-14 15:31:49,630 - INFO - Finished converting document 4_2025-01-02 in 0.05 sec.
2025-11-14 15:31:49,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,680 - INFO - Going to convert document batch...
2025-11-14 15:31:49,681 - 

Converted 'data\edgar_documents\AIG\4_2024-12-11' --> 'data\processed_data\AIG\4_2024-12-11.md'
Converted 'data\edgar_documents\AIG\4_2024-12-17' --> 'data\processed_data\AIG\4_2024-12-17.md'
Converted 'data\edgar_documents\AIG\4_2025-01-02' --> 'data\processed_data\AIG\4_2025-01-02.md'


2025-11-14 15:31:49,703 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:31:49,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,756 - INFO - Going to convert document batch...
2025-11-14 15:31:49,756 - INFO - Processing document 4_2025-02-18
2025-11-14 15:31:49,773 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:31:49,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,830 - INFO - Going to convert document batch...
2025-11-14 15:31:49,830 - INFO - Processing document 4_2025-02-20
2025-11-14 15:31:49,851 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 15:31:49,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,906 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\4_2025-01-03' --> 'data\processed_data\AIG\4_2025-01-03.md'
Converted 'data\edgar_documents\AIG\4_2025-02-18' --> 'data\processed_data\AIG\4_2025-02-18.md'
Converted 'data\edgar_documents\AIG\4_2025-02-20' --> 'data\processed_data\AIG\4_2025-02-20.md'


2025-11-14 15:31:49,906 - INFO - Processing document 4_2025-02-21
2025-11-14 15:31:49,926 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 15:31:49,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,982 - INFO - Going to convert document batch...
2025-11-14 15:31:49,982 - INFO - Processing document 4_2025-02-25
2025-11-14 15:31:50,008 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 15:31:50,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,066 - INFO - Going to convert document batch...
2025-11-14 15:31:50,067 - INFO - Processing document 4_2025-03-05
2025-11-14 15:31:50,091 - INFO - Finished converting document 4_2025-03-05 in 0.06 sec.
2025-11-14 15:31:50,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2025-02-21' --> 'data\processed_data\AIG\4_2025-02-21.md'
Converted 'data\edgar_documents\AIG\4_2025-02-25' --> 'data\processed_data\AIG\4_2025-02-25.md'
Converted 'data\edgar_documents\AIG\4_2025-03-05' --> 'data\processed_data\AIG\4_2025-03-05.md'


2025-11-14 15:31:50,149 - INFO - Going to convert document batch...
2025-11-14 15:31:50,150 - INFO - Processing document 4_2025-04-02
2025-11-14 15:31:50,175 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 15:31:50,225 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:50,226 - ERROR - Input document 4_2025-05-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:31:50,227 - INFO - Going to convert document batch...
2025-11-14 15:31:50,240 - IN

Converted 'data\edgar_documents\AIG\4_2025-04-02' --> 'data\processed_data\AIG\4_2025-04-02.md'
Error processing data\edgar_documents\AIG\4_2025-05-05: File format not allowed: data\edgar_documents\AIG\4_2025-05-05
Converted 'data\edgar_documents\AIG\4_2025-05-06' --> 'data\processed_data\AIG\4_2025-05-06.md'
Converted 'data\edgar_documents\AIG\4_2025-05-14' --> 'data\processed_data\AIG\4_2025-05-14.md'


2025-11-14 15:31:50,389 - INFO - Processing document 4_2025-05-15
2025-11-14 15:31:50,408 - INFO - Finished converting document 4_2025-05-15 in 0.05 sec.
2025-11-14 15:31:50,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,463 - INFO - Going to convert document batch...
2025-11-14 15:31:50,464 - INFO - Processing document 4_2025-05-20
2025-11-14 15:31:50,489 - INFO - Finished converting document 4_2025-05-20 in 0.06 sec.
2025-11-14 15:31:50,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,550 - INFO - Going to convert document batch...
2025-11-14 15:31:50,551 - INFO - Processing document 4_2025-05-22
2025-11-14 15:31:50,577 - INFO - Finished converting document 4_2025-05-22 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2025-05-15' --> 'data\processed_data\AIG\4_2025-05-15.md'
Converted 'data\edgar_documents\AIG\4_2025-05-20' --> 'data\processed_data\AIG\4_2025-05-20.md'
Converted 'data\edgar_documents\AIG\4_2025-05-22' --> 'data\processed_data\AIG\4_2025-05-22.md'


2025-11-14 15:31:50,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,639 - INFO - Going to convert document batch...
2025-11-14 15:31:50,641 - INFO - Processing document 4_2025-06-04
2025-11-14 15:31:50,659 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 15:31:50,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,702 - INFO - Going to convert document batch...
2025-11-14 15:31:50,703 - INFO - Processing document 4_2025-06-17
2025-11-14 15:31:50,725 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 15:31:50,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,778 - INFO - Going to convert document batch...
2025-11-14 15:31:50,779 - INFO - Processing document 4_2025-06-30
2025-11-14 15:31:50,798 - INFO - Finished converting document 4_2025-06-30 in 0.05 sec.
2025-11-14 15:31:50,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2025-06-04' --> 'data\processed_data\AIG\4_2025-06-04.md'
Converted 'data\edgar_documents\AIG\4_2025-06-17' --> 'data\processed_data\AIG\4_2025-06-17.md'
Converted 'data\edgar_documents\AIG\4_2025-06-30' --> 'data\processed_data\AIG\4_2025-06-30.md'


2025-11-14 15:31:50,858 - INFO - Processing document 4_2025-07-03
2025-11-14 15:31:50,882 - INFO - Finished converting document 4_2025-07-03 in 0.05 sec.
2025-11-14 15:31:50,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,937 - INFO - Going to convert document batch...
2025-11-14 15:31:50,937 - INFO - Processing document 4_2025-08-07
2025-11-14 15:31:50,956 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.
2025-11-14 15:31:50,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,005 - INFO - Going to convert document batch...
2025-11-14 15:31:51,005 - INFO - Processing document 4_2025-08-08
2025-11-14 15:31:51,021 - INFO - Finished converting document 4_2025-08-08 in 0.05 sec.
2025-11-14 15:31:51,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,059 - INFO - Going to convert document batch...
2025-11-14 15:31:51,060 - INFO - Processing document 4_2025-08-19
2025-11-14 15:31:51,079 - IN

Converted 'data\edgar_documents\AIG\4_2025-07-03' --> 'data\processed_data\AIG\4_2025-07-03.md'
Converted 'data\edgar_documents\AIG\4_2025-08-07' --> 'data\processed_data\AIG\4_2025-08-07.md'
Converted 'data\edgar_documents\AIG\4_2025-08-08' --> 'data\processed_data\AIG\4_2025-08-08.md'


2025-11-14 15:31:51,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,130 - INFO - Going to convert document batch...
2025-11-14 15:31:51,131 - INFO - Processing document 4_2025-09-08
2025-11-14 15:31:51,148 - INFO - Finished converting document 4_2025-09-08 in 0.05 sec.
2025-11-14 15:31:51,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,224 - INFO - Going to convert document batch...
2025-11-14 15:31:51,224 - INFO - Processing document 4_2025-10-01
2025-11-14 15:31:51,248 - INFO - Finished converting document 4_2025-10-01 in 0.08 sec.
2025-11-14 15:31:51,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2025-08-19' --> 'data\processed_data\AIG\4_2025-08-19.md'
Converted 'data\edgar_documents\AIG\4_2025-09-08' --> 'data\processed_data\AIG\4_2025-09-08.md'
Converted 'data\edgar_documents\AIG\4_2025-10-01' --> 'data\processed_data\AIG\4_2025-10-01.md'


2025-11-14 15:31:51,493 - INFO - Going to convert document batch...
2025-11-14 15:31:51,493 - INFO - Processing document 4_2025-10-03
2025-11-14 15:31:51,512 - INFO - Finished converting document 4_2025-10-03 in 0.25 sec.
2025-11-14 15:31:51,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,556 - INFO - Going to convert document batch...
2025-11-14 15:31:51,557 - INFO - Processing document 4_2025-10-17
2025-11-14 15:31:51,579 - INFO - Finished converting document 4_2025-10-17 in 0.05 sec.
2025-11-14 15:31:51,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,628 - INFO - Going to convert document batch...
2025-11-14 15:31:51,629 - INFO - Processing document 4_2025-10-22
2025-11-14 15:31:51,648 - INFO - Finished converting document 4_2025-10-22 in 0.05 sec.
2025-11-14 15:31:51,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,697 - INFO - Going to convert document batch...
2025-11-14 15:31:51,698 - 

Converted 'data\edgar_documents\AIG\4_2025-10-03' --> 'data\processed_data\AIG\4_2025-10-03.md'
Converted 'data\edgar_documents\AIG\4_2025-10-17' --> 'data\processed_data\AIG\4_2025-10-17.md'
Converted 'data\edgar_documents\AIG\4_2025-10-22' --> 'data\processed_data\AIG\4_2025-10-22.md'


2025-11-14 15:31:51,715 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 15:31:51,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,766 - INFO - Going to convert document batch...
2025-11-14 15:31:51,767 - INFO - Processing document 8-K_2023-01-10
2025-11-14 15:31:51,786 - INFO - Finished converting document 8-K_2023-01-10 in 0.05 sec.
2025-11-14 15:31:51,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,831 - INFO - Going to convert document batch...
2025-11-14 15:31:51,832 - INFO - Processing document 8-K_2023-01-23
2025-11-14 15:31:51,852 - INFO - Finished converting document 8-K_2023-01-23 in 0.05 sec.
2025-11-14 15:31:51,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,903 - INFO - Going to convert document batch...
2025-11-14 15:31:51,904 - INFO - Processing document 8-K_2023-01-30
2025-11-14 15:31:51,927 - INFO - Finished converting document 8-K_2023-01-30 in 0.06

Converted 'data\edgar_documents\AIG\4_2025-11-05' --> 'data\processed_data\AIG\4_2025-11-05.md'
Converted 'data\edgar_documents\AIG\8-K_2023-01-10' --> 'data\processed_data\AIG\8-K_2023-01-10.md'
Converted 'data\edgar_documents\AIG\8-K_2023-01-23' --> 'data\processed_data\AIG\8-K_2023-01-23.md'


2025-11-14 15:31:51,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,974 - INFO - Going to convert document batch...
2025-11-14 15:31:51,975 - INFO - Processing document 8-K_2023-02-15
2025-11-14 15:31:51,996 - INFO - Finished converting document 8-K_2023-02-15 in 0.06 sec.
2025-11-14 15:31:52,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,044 - INFO - Going to convert document batch...
2025-11-14 15:31:52,045 - INFO - Processing document 8-K_2023-02-27
2025-11-14 15:31:52,071 - INFO - Finished converting document 8-K_2023-02-27 in 0.05 sec.
2025-11-14 15:31:52,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,127 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2023-01-30' --> 'data\processed_data\AIG\8-K_2023-01-30.md'
Converted 'data\edgar_documents\AIG\8-K_2023-02-15' --> 'data\processed_data\AIG\8-K_2023-02-15.md'
Converted 'data\edgar_documents\AIG\8-K_2023-02-27' --> 'data\processed_data\AIG\8-K_2023-02-27.md'


2025-11-14 15:31:52,127 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:31:52,149 - INFO - Finished converting document 8-K_2023-03-13 in 0.06 sec.
2025-11-14 15:31:52,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,194 - INFO - Going to convert document batch...
2025-11-14 15:31:52,195 - INFO - Processing document 8-K_2023-03-23
2025-11-14 15:31:52,210 - INFO - Finished converting document 8-K_2023-03-23 in 0.05 sec.
2025-11-14 15:31:52,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,251 - INFO - Going to convert document batch...
2025-11-14 15:31:52,251 - INFO - Processing document 8-K_2023-03-27
2025-11-14 15:31:52,290 - INFO - Finished converting document 8-K_2023-03-27 in 0.06 sec.
2025-11-14 15:31:52,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-03-13' --> 'data\processed_data\AIG\8-K_2023-03-13.md'
Converted 'data\edgar_documents\AIG\8-K_2023-03-23' --> 'data\processed_data\AIG\8-K_2023-03-23.md'
Converted 'data\edgar_documents\AIG\8-K_2023-03-27' --> 'data\processed_data\AIG\8-K_2023-03-27.md'


2025-11-14 15:31:52,351 - INFO - Going to convert document batch...
2025-11-14 15:31:52,353 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:31:52,377 - INFO - Finished converting document 8-K_2023-05-04 in 0.06 sec.
2025-11-14 15:31:52,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,433 - INFO - Going to convert document batch...
2025-11-14 15:31:52,434 - INFO - Processing document 8-K_2023-05-15
2025-11-14 15:31:52,461 - INFO - Finished converting document 8-K_2023-05-15 in 0.06 sec.
2025-11-14 15:31:52,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,513 - INFO - Going to convert document batch...
2025-11-14 15:31:52,514 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:31:52,539 - INFO - Finished converting document 8-K_2023-05-22 in 0.06 sec.
2025-11-14 15:31:52,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-05-04' --> 'data\processed_data\AIG\8-K_2023-05-04.md'
Converted 'data\edgar_documents\AIG\8-K_2023-05-15' --> 'data\processed_data\AIG\8-K_2023-05-15.md'
Converted 'data\edgar_documents\AIG\8-K_2023-05-22' --> 'data\processed_data\AIG\8-K_2023-05-22.md'


2025-11-14 15:31:52,598 - INFO - Going to convert document batch...
2025-11-14 15:31:52,598 - INFO - Processing document 8-K_2023-06-23
2025-11-14 15:31:52,623 - INFO - Finished converting document 8-K_2023-06-23 in 0.08 sec.
2025-11-14 15:31:52,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,685 - INFO - Going to convert document batch...
2025-11-14 15:31:52,687 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:31:52,707 - INFO - Finished converting document 8-K_2023-08-01 in 0.06 sec.
2025-11-14 15:31:52,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,759 - INFO - Going to convert document batch...
2025-11-14 15:31:52,760 - INFO - Processing document 8-K_2023-08-17
2025-11-14 15:31:52,782 - INFO - Finished converting document 8-K_2023-08-17 in 0.06 sec.
2025-11-14 15:31:52,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-06-23' --> 'data\processed_data\AIG\8-K_2023-06-23.md'
Converted 'data\edgar_documents\AIG\8-K_2023-08-01' --> 'data\processed_data\AIG\8-K_2023-08-01.md'
Converted 'data\edgar_documents\AIG\8-K_2023-08-17' --> 'data\processed_data\AIG\8-K_2023-08-17.md'


2025-11-14 15:31:52,840 - INFO - Going to convert document batch...
2025-11-14 15:31:52,841 - INFO - Processing document 8-K_2023-09-08
2025-11-14 15:31:52,868 - INFO - Finished converting document 8-K_2023-09-08 in 0.06 sec.
2025-11-14 15:31:52,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,909 - INFO - Going to convert document batch...
2025-11-14 15:31:52,910 - INFO - Processing document 8-K_2023-11-01
2025-11-14 15:31:52,932 - INFO - Finished converting document 8-K_2023-11-01 in 0.03 sec.
2025-11-14 15:31:52,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,999 - INFO - Going to convert document batch...
2025-11-14 15:31:52,999 - INFO - Processing document 8-K_2023-11-06
2025-11-14 15:31:53,020 - INFO - Finished converting document 8-K_2023-11-06 in 0.08 sec.
2025-11-14 15:31:53,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,081 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2023-09-08' --> 'data\processed_data\AIG\8-K_2023-09-08.md'
Converted 'data\edgar_documents\AIG\8-K_2023-11-01' --> 'data\processed_data\AIG\8-K_2023-11-01.md'
Converted 'data\edgar_documents\AIG\8-K_2023-11-06' --> 'data\processed_data\AIG\8-K_2023-11-06.md'


2025-11-14 15:31:53,082 - INFO - Processing document 8-K_2023-11-21
2025-11-14 15:31:53,109 - INFO - Finished converting document 8-K_2023-11-21 in 0.08 sec.
2025-11-14 15:31:53,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,150 - INFO - Going to convert document batch...
2025-11-14 15:31:53,151 - INFO - Processing document 8-K_2023-12-04
2025-11-14 15:31:53,173 - INFO - Finished converting document 8-K_2023-12-04 in 0.05 sec.
2025-11-14 15:31:53,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,214 - INFO - Going to convert document batch...
2025-11-14 15:31:53,215 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:31:53,244 - INFO - Finished converting document 8-K_2024-01-31 in 0.05 sec.
2025-11-14 15:31:53,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,294 - INFO - Going to convert document batch...
2025-11-14 15:31:53,294 - INFO - Processing document 8-K_2024-02-01


Converted 'data\edgar_documents\AIG\8-K_2023-11-21' --> 'data\processed_data\AIG\8-K_2023-11-21.md'
Converted 'data\edgar_documents\AIG\8-K_2023-12-04' --> 'data\processed_data\AIG\8-K_2023-12-04.md'
Converted 'data\edgar_documents\AIG\8-K_2024-01-31' --> 'data\processed_data\AIG\8-K_2024-01-31.md'


2025-11-14 15:31:53,309 - INFO - Finished converting document 8-K_2024-02-01 in 0.06 sec.
2025-11-14 15:31:53,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,352 - INFO - Going to convert document batch...
2025-11-14 15:31:53,353 - INFO - Processing document 8-K_2024-02-07
2025-11-14 15:31:53,376 - INFO - Finished converting document 8-K_2024-02-07 in 0.06 sec.
2025-11-14 15:31:53,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,422 - INFO - Going to convert document batch...
2025-11-14 15:31:53,423 - INFO - Processing document 8-K_2024-02-13
2025-11-14 15:31:53,445 - INFO - Finished converting document 8-K_2024-02-13 in 0.05 sec.
2025-11-14 15:31:53,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,496 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-02-01' --> 'data\processed_data\AIG\8-K_2024-02-01.md'
Converted 'data\edgar_documents\AIG\8-K_2024-02-07' --> 'data\processed_data\AIG\8-K_2024-02-07.md'
Converted 'data\edgar_documents\AIG\8-K_2024-02-13' --> 'data\processed_data\AIG\8-K_2024-02-13.md'


2025-11-14 15:31:53,496 - INFO - Processing document 8-K_2024-04-22
2025-11-14 15:31:53,512 - INFO - Finished converting document 8-K_2024-04-22 in 0.06 sec.
2025-11-14 15:31:53,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,542 - INFO - Going to convert document batch...
2025-11-14 15:31:53,543 - INFO - Processing document 8-K_2024-05-01
2025-11-14 15:31:53,565 - INFO - Finished converting document 8-K_2024-05-01 in 0.05 sec.
2025-11-14 15:31:53,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,611 - INFO - Going to convert document batch...
2025-11-14 15:31:53,612 - INFO - Processing document 8-K_2024-05-16
2025-11-14 15:31:53,636 - INFO - Finished converting document 8-K_2024-05-16 in 0.06 sec.
2025-11-14 15:31:53,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,694 - INFO - Going to convert document batch...
2025-11-14 15:31:53,695 - INFO - Processing document 8-K_2024-05-17


Converted 'data\edgar_documents\AIG\8-K_2024-04-22' --> 'data\processed_data\AIG\8-K_2024-04-22.md'
Converted 'data\edgar_documents\AIG\8-K_2024-05-01' --> 'data\processed_data\AIG\8-K_2024-05-01.md'
Converted 'data\edgar_documents\AIG\8-K_2024-05-16' --> 'data\processed_data\AIG\8-K_2024-05-16.md'


2025-11-14 15:31:53,736 - INFO - Finished converting document 8-K_2024-05-17 in 0.08 sec.
2025-11-14 15:31:53,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,815 - INFO - Going to convert document batch...
2025-11-14 15:31:53,816 - INFO - Processing document 8-K_2024-06-10
2025-11-14 15:31:53,839 - INFO - Finished converting document 8-K_2024-06-10 in 0.08 sec.
2025-11-14 15:31:53,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,894 - INFO - Going to convert document batch...
2025-11-14 15:31:53,894 - INFO - Processing document 8-K_2024-06-13
2025-11-14 15:31:53,919 - INFO - Finished converting document 8-K_2024-06-13 in 0.08 sec.
2025-11-14 15:31:53,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,954 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-05-17' --> 'data\processed_data\AIG\8-K_2024-05-17.md'
Converted 'data\edgar_documents\AIG\8-K_2024-06-10' --> 'data\processed_data\AIG\8-K_2024-06-10.md'
Converted 'data\edgar_documents\AIG\8-K_2024-06-13' --> 'data\processed_data\AIG\8-K_2024-06-13.md'


2025-11-14 15:31:53,955 - INFO - Processing document 8-K_2024-06-25
2025-11-14 15:31:53,975 - INFO - Finished converting document 8-K_2024-06-25 in 0.05 sec.
2025-11-14 15:31:54,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,031 - INFO - Going to convert document batch...
2025-11-14 15:31:54,031 - INFO - Processing document 8-K_2024-07-31
2025-11-14 15:31:54,053 - INFO - Finished converting document 8-K_2024-07-31 in 0.06 sec.
2025-11-14 15:31:54,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,104 - INFO - Going to convert document batch...
2025-11-14 15:31:54,105 - INFO - Processing document 8-K_2024-09-03
2025-11-14 15:31:54,125 - INFO - Finished converting document 8-K_2024-09-03 in 0.06 sec.
2025-11-14 15:31:54,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2024-06-25' --> 'data\processed_data\AIG\8-K_2024-06-25.md'
Converted 'data\edgar_documents\AIG\8-K_2024-07-31' --> 'data\processed_data\AIG\8-K_2024-07-31.md'
Converted 'data\edgar_documents\AIG\8-K_2024-09-03' --> 'data\processed_data\AIG\8-K_2024-09-03.md'


2025-11-14 15:31:54,182 - INFO - Going to convert document batch...
2025-11-14 15:31:54,183 - INFO - Processing document 8-K_2024-09-18
2025-11-14 15:31:54,205 - INFO - Finished converting document 8-K_2024-09-18 in 0.06 sec.
2025-11-14 15:31:54,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,256 - INFO - Going to convert document batch...
2025-11-14 15:31:54,257 - INFO - Processing document 8-K_2024-09-27
2025-11-14 15:31:54,275 - INFO - Finished converting document 8-K_2024-09-27 in 0.05 sec.
2025-11-14 15:31:54,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,324 - INFO - Going to convert document batch...
2025-11-14 15:31:54,325 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:31:54,339 - INFO - Finished converting document 8-K_2024-10-11 in 0.06 sec.
2025-11-14 15:31:54,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,401 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-09-18' --> 'data\processed_data\AIG\8-K_2024-09-18.md'
Converted 'data\edgar_documents\AIG\8-K_2024-09-27' --> 'data\processed_data\AIG\8-K_2024-09-27.md'
Converted 'data\edgar_documents\AIG\8-K_2024-10-11' --> 'data\processed_data\AIG\8-K_2024-10-11.md'


2025-11-14 15:31:54,401 - INFO - Processing document 8-K_2024-10-21
2025-11-14 15:31:54,423 - INFO - Finished converting document 8-K_2024-10-21 in 0.08 sec.
2025-11-14 15:31:54,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,471 - INFO - Going to convert document batch...
2025-11-14 15:31:54,472 - INFO - Processing document 8-K_2024-11-04
2025-11-14 15:31:54,491 - INFO - Finished converting document 8-K_2024-11-04 in 0.05 sec.
2025-11-14 15:31:54,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,529 - INFO - Going to convert document batch...
2025-11-14 15:31:54,529 - INFO - Processing document 8-K_2024-11-08
2025-11-14 15:31:54,549 - INFO - Finished converting document 8-K_2024-11-08 in 0.05 sec.
2025-11-14 15:31:54,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,600 - INFO - Going to convert document batch...
2025-11-14 15:31:54,602 - INFO - Processing document 8-K_2024-11-27


Converted 'data\edgar_documents\AIG\8-K_2024-10-21' --> 'data\processed_data\AIG\8-K_2024-10-21.md'
Converted 'data\edgar_documents\AIG\8-K_2024-11-04' --> 'data\processed_data\AIG\8-K_2024-11-04.md'
Converted 'data\edgar_documents\AIG\8-K_2024-11-08' --> 'data\processed_data\AIG\8-K_2024-11-08.md'


2025-11-14 15:31:54,668 - INFO - Finished converting document 8-K_2024-11-27 in 0.11 sec.
2025-11-14 15:31:54,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,721 - INFO - Going to convert document batch...
2025-11-14 15:31:54,722 - INFO - Processing document 8-K_2024-12-06
2025-11-14 15:31:54,741 - INFO - Finished converting document 8-K_2024-12-06 in 0.05 sec.
2025-11-14 15:31:54,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,794 - INFO - Going to convert document batch...
2025-11-14 15:31:54,795 - INFO - Processing document 8-K_2024-12-13
2025-11-14 15:31:54,815 - INFO - Finished converting document 8-K_2024-12-13 in 0.06 sec.
2025-11-14 15:31:54,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,861 - INFO - Going to convert document batch...
2025-11-14 15:31:54,861 - INFO - Processing document 8-K_2025-02-11
2025-11-14 15:31:54,882 - INFO - Finished converting document 8-K_2025-02-11 in 0.

Converted 'data\edgar_documents\AIG\8-K_2024-11-27' --> 'data\processed_data\AIG\8-K_2024-11-27.md'
Converted 'data\edgar_documents\AIG\8-K_2024-12-06' --> 'data\processed_data\AIG\8-K_2024-12-06.md'
Converted 'data\edgar_documents\AIG\8-K_2024-12-13' --> 'data\processed_data\AIG\8-K_2024-12-13.md'


2025-11-14 15:31:54,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,927 - INFO - Going to convert document batch...
2025-11-14 15:31:54,927 - INFO - Processing document 8-K_2025-02-20
2025-11-14 15:31:54,948 - INFO - Finished converting document 8-K_2025-02-20 in 0.05 sec.
2025-11-14 15:31:54,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,986 - INFO - Going to convert document batch...
2025-11-14 15:31:54,987 - INFO - Processing document 8-K_2025-03-31
2025-11-14 15:31:55,007 - INFO - Finished converting document 8-K_2025-03-31 in 0.05 sec.
2025-11-14 15:31:55,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,081 - INFO - Going to convert document batch...
2025-11-14 15:31:55,081 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:31:55,099 - INFO - Finished converting document 8-K_2025-05-01 in 0.08 sec.


Converted 'data\edgar_documents\AIG\8-K_2025-02-11' --> 'data\processed_data\AIG\8-K_2025-02-11.md'
Converted 'data\edgar_documents\AIG\8-K_2025-02-20' --> 'data\processed_data\AIG\8-K_2025-02-20.md'
Converted 'data\edgar_documents\AIG\8-K_2025-03-31' --> 'data\processed_data\AIG\8-K_2025-03-31.md'


2025-11-14 15:31:55,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,180 - INFO - Going to convert document batch...
2025-11-14 15:31:55,181 - INFO - Processing document 8-K_2025-05-07
2025-11-14 15:31:55,213 - INFO - Finished converting document 8-K_2025-05-07 in 0.11 sec.
2025-11-14 15:31:55,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,268 - INFO - Going to convert document batch...
2025-11-14 15:31:55,269 - INFO - Processing document 8-K_2025-05-15


Converted 'data\edgar_documents\AIG\8-K_2025-05-01' --> 'data\processed_data\AIG\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AIG\8-K_2025-05-07' --> 'data\processed_data\AIG\8-K_2025-05-07.md'


2025-11-14 15:31:55,522 - INFO - Finished converting document 8-K_2025-05-15 in 0.28 sec.
2025-11-14 15:31:55,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,568 - INFO - Going to convert document batch...
2025-11-14 15:31:55,569 - INFO - Processing document 8-K_2025-05-16
2025-11-14 15:31:55,597 - INFO - Finished converting document 8-K_2025-05-16 in 0.06 sec.
2025-11-14 15:31:55,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,640 - INFO - Going to convert document batch...
2025-11-14 15:31:55,641 - INFO - Processing document 8-K_2025-06-02
2025-11-14 15:31:55,660 - INFO - Finished converting document 8-K_2025-06-02 in 0.05 sec.
2025-11-14 15:31:55,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,703 - INFO - Going to convert document batch...
2025-11-14 15:31:55,703 - INFO - Processing document 8-K_2025-06-09
2025-11-14 15:31:55,725 - INFO - Finished converting document 8-K_2025-06-09 in 0.

Converted 'data\edgar_documents\AIG\8-K_2025-05-15' --> 'data\processed_data\AIG\8-K_2025-05-15.md'
Converted 'data\edgar_documents\AIG\8-K_2025-05-16' --> 'data\processed_data\AIG\8-K_2025-05-16.md'
Converted 'data\edgar_documents\AIG\8-K_2025-06-02' --> 'data\processed_data\AIG\8-K_2025-06-02.md'


2025-11-14 15:31:55,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,777 - INFO - Going to convert document batch...
2025-11-14 15:31:55,778 - INFO - Processing document 8-K_2025-07-21
2025-11-14 15:31:55,798 - INFO - Finished converting document 8-K_2025-07-21 in 0.06 sec.
2025-11-14 15:31:55,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,828 - INFO - Going to convert document batch...
2025-11-14 15:31:55,829 - INFO - Processing document 8-K_2025-08-06
2025-11-14 15:31:55,846 - INFO - Finished converting document 8-K_2025-08-06 in 0.03 sec.
2025-11-14 15:31:55,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,899 - INFO - Going to convert document batch...
2025-11-14 15:31:55,901 - INFO - Processing document 8-K_2025-08-18
2025-11-14 15:31:55,925 - INFO - Finished converting document 8-K_2025-08-18 in 0.06 sec.


Converted 'data\edgar_documents\AIG\8-K_2025-06-09' --> 'data\processed_data\AIG\8-K_2025-06-09.md'
Converted 'data\edgar_documents\AIG\8-K_2025-07-21' --> 'data\processed_data\AIG\8-K_2025-07-21.md'
Converted 'data\edgar_documents\AIG\8-K_2025-08-06' --> 'data\processed_data\AIG\8-K_2025-08-06.md'


2025-11-14 15:31:55,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,957 - INFO - Going to convert document batch...
2025-11-14 15:31:55,957 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:31:55,971 - INFO - Finished converting document 8-K_2025-10-03 in 0.03 sec.
2025-11-14 15:31:55,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,999 - INFO - Going to convert document batch...
2025-11-14 15:31:56,000 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:31:56,017 - INFO - Finished converting document 8-K_2025-11-04 in 0.05 sec.
2025-11-14 15:31:56,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2025-08-18' --> 'data\processed_data\AIG\8-K_2025-08-18.md'
Converted 'data\edgar_documents\AIG\8-K_2025-10-03' --> 'data\processed_data\AIG\8-K_2025-10-03.md'
Converted 'data\edgar_documents\AIG\8-K_2025-11-04' --> 'data\processed_data\AIG\8-K_2025-11-04.md'


2025-11-14 15:31:56,474 - INFO - Going to convert document batch...
2025-11-14 15:31:56,475 - INFO - Processing document DEF-14A_2023-03-29
2025-11-14 15:31:58,133 - INFO - Finished converting document DEF-14A_2023-03-29 in 2.09 sec.
2025-11-14 15:31:59,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2023-03-29' --> 'data\processed_data\AIG\DEF-14A_2023-03-29.md'


2025-11-14 15:31:59,533 - INFO - Going to convert document batch...
2025-11-14 15:31:59,535 - INFO - Processing document DEF-14A_2024-04-02
2025-11-14 15:32:01,596 - INFO - Finished converting document DEF-14A_2024-04-02 in 2.64 sec.
2025-11-14 15:32:02,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2024-04-02' --> 'data\processed_data\AIG\DEF-14A_2024-04-02.md'


2025-11-14 15:32:03,108 - INFO - Going to convert document batch...
2025-11-14 15:32:03,109 - INFO - Processing document DEF-14A_2025-04-02
2025-11-14 15:32:04,846 - INFO - Finished converting document DEF-14A_2025-04-02 in 2.50 sec.
2025-11-14 15:32:05,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2025-04-02' --> 'data\processed_data\AIG\DEF-14A_2025-04-02.md'
Processed 158 new files. Errors: 6
Found 147 files to process in data\edgar_documents\AMD


2025-11-14 15:32:06,318 - INFO - Going to convert document batch...
2025-11-14 15:32:06,319 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:32:06,319 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:32:07,495 - INFO - Finished converting document 10-K_2023-02-27 in 1.98 sec.
2025-11-14 15:32:08,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2023-02-27' --> 'data\processed_data\AMD\10-K_2023-02-27.md'


2025-11-14 15:32:08,494 - INFO - Going to convert document batch...
2025-11-14 15:32:08,494 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:32:09,664 - INFO - Finished converting document 10-K_2024-01-31 in 1.66 sec.
2025-11-14 15:32:10,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2024-01-31' --> 'data\processed_data\AMD\10-K_2024-01-31.md'


2025-11-14 15:32:10,560 - INFO - Going to convert document batch...
2025-11-14 15:32:10,561 - INFO - Processing document 10-K_2025-02-05
2025-11-14 15:32:11,470 - INFO - Finished converting document 10-K_2025-02-05 in 1.36 sec.
2025-11-14 15:32:12,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2025-02-05' --> 'data\processed_data\AMD\10-K_2025-02-05.md'


2025-11-14 15:32:12,602 - INFO - Going to convert document batch...
2025-11-14 15:32:12,603 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 15:32:13,184 - INFO - Finished converting document 10-Q_2023-05-03 in 1.19 sec.
2025-11-14 15:32:13,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-05-03' --> 'data\processed_data\AMD\10-Q_2023-05-03.md'


2025-11-14 15:32:13,784 - INFO - Going to convert document batch...
2025-11-14 15:32:13,785 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:32:14,295 - INFO - Finished converting document 10-Q_2023-08-02 in 0.84 sec.
2025-11-14 15:32:14,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-08-02' --> 'data\processed_data\AMD\10-Q_2023-08-02.md'


2025-11-14 15:32:14,839 - INFO - Going to convert document batch...
2025-11-14 15:32:14,840 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:32:15,481 - INFO - Finished converting document 10-Q_2023-11-01 in 0.95 sec.
2025-11-14 15:32:15,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-11-01' --> 'data\processed_data\AMD\10-Q_2023-11-01.md'


2025-11-14 15:32:16,291 - INFO - Going to convert document batch...
2025-11-14 15:32:16,292 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:32:16,751 - INFO - Finished converting document 10-Q_2024-05-01 in 1.02 sec.
2025-11-14 15:32:16,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-05-01' --> 'data\processed_data\AMD\10-Q_2024-05-01.md'


2025-11-14 15:32:17,253 - INFO - Going to convert document batch...
2025-11-14 15:32:17,254 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:32:17,783 - INFO - Finished converting document 10-Q_2024-07-31 in 0.81 sec.
2025-11-14 15:32:18,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-07-31' --> 'data\processed_data\AMD\10-Q_2024-07-31.md'


2025-11-14 15:32:18,425 - INFO - Going to convert document batch...
2025-11-14 15:32:18,426 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 15:32:19,188 - INFO - Finished converting document 10-Q_2024-10-30 in 1.14 sec.
2025-11-14 15:32:19,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-10-30' --> 'data\processed_data\AMD\10-Q_2024-10-30.md'


2025-11-14 15:32:19,692 - INFO - Going to convert document batch...
2025-11-14 15:32:19,694 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:32:20,135 - INFO - Finished converting document 10-Q_2025-05-07 in 0.69 sec.
2025-11-14 15:32:20,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-05-07' --> 'data\processed_data\AMD\10-Q_2025-05-07.md'


2025-11-14 15:32:20,689 - INFO - Going to convert document batch...
2025-11-14 15:32:20,689 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:32:21,233 - INFO - Finished converting document 10-Q_2025-08-06 in 0.86 sec.
2025-11-14 15:32:21,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-08-06' --> 'data\processed_data\AMD\10-Q_2025-08-06.md'


2025-11-14 15:32:22,154 - INFO - Going to convert document batch...
2025-11-14 15:32:22,155 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:32:22,702 - INFO - Finished converting document 10-Q_2025-11-05 in 1.19 sec.
2025-11-14 15:32:22,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:22,986 - INFO - Going to convert document batch...
2025-11-14 15:32:22,987 - INFO - Processing document 4_2023-01-18
2025-11-14 15:32:23,008 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:32:23,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,068 - INFO - Going to convert document batch...
2025-11-14 15:32:23,069 - INFO - Processing document 4_2023-02-08
2025-11-14 15:32:23,092 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.
2025-11-14 15:32:23,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-11-05' --> 'data\processed_data\AMD\10-Q_2025-11-05.md'
Converted 'data\edgar_documents\AMD\4_2023-01-18' --> 'data\processed_data\AMD\4_2023-01-18.md'
Converted 'data\edgar_documents\AMD\4_2023-02-08' --> 'data\processed_data\AMD\4_2023-02-08.md'


2025-11-14 15:32:23,152 - INFO - Going to convert document batch...
2025-11-14 15:32:23,153 - INFO - Processing document 4_2023-02-13
2025-11-14 15:32:23,171 - INFO - Finished converting document 4_2023-02-13 in 0.06 sec.
2025-11-14 15:32:23,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,228 - INFO - Going to convert document batch...
2025-11-14 15:32:23,229 - INFO - Processing document 4_2023-02-16
2025-11-14 15:32:23,252 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.
2025-11-14 15:32:23,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,301 - INFO - Going to convert document batch...
2025-11-14 15:32:23,302 - INFO - Processing document 4_2023-02-17
2025-11-14 15:32:23,322 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 15:32:23,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-02-13' --> 'data\processed_data\AMD\4_2023-02-13.md'
Converted 'data\edgar_documents\AMD\4_2023-02-16' --> 'data\processed_data\AMD\4_2023-02-16.md'
Converted 'data\edgar_documents\AMD\4_2023-02-17' --> 'data\processed_data\AMD\4_2023-02-17.md'


2025-11-14 15:32:23,382 - INFO - Going to convert document batch...
2025-11-14 15:32:23,383 - INFO - Processing document 4_2023-03-08
2025-11-14 15:32:23,419 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:32:23,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,541 - INFO - Going to convert document batch...
2025-11-14 15:32:23,542 - INFO - Processing document 4_2023-03-09
2025-11-14 15:32:23,635 - INFO - Finished converting document 4_2023-03-09 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-08' --> 'data\processed_data\AMD\4_2023-03-08.md'


2025-11-14 15:32:23,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,781 - INFO - Going to convert document batch...
2025-11-14 15:32:23,782 - INFO - Processing document 4_2023-03-17
2025-11-14 15:32:23,858 - INFO - Finished converting document 4_2023-03-17 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-09' --> 'data\processed_data\AMD\4_2023-03-09.md'


2025-11-14 15:32:23,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,958 - INFO - Going to convert document batch...
2025-11-14 15:32:23,959 - INFO - Processing document 4_2023-03-20
2025-11-14 15:32:24,024 - INFO - Finished converting document 4_2023-03-20 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-17' --> 'data\processed_data\AMD\4_2023-03-17.md'
Converted 'data\edgar_documents\AMD\4_2023-03-20' --> 'data\processed_data\AMD\4_2023-03-20.md'


2025-11-14 15:32:24,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,146 - INFO - Going to convert document batch...
2025-11-14 15:32:24,147 - INFO - Processing document 4_2023-04-10
2025-11-14 15:32:24,201 - INFO - Finished converting document 4_2023-04-10 in 0.11 sec.
2025-11-14 15:32:24,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,293 - INFO - Going to convert document batch...
2025-11-14 15:32:24,294 - INFO - Processing document 4_2023-04-14
2025-11-14 15:32:24,339 - INFO - Finished converting document 4_2023-04-14 in 0.08 sec.
2025-11-14 15:32:24,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,439 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2023-04-10' --> 'data\processed_data\AMD\4_2023-04-10.md'
Converted 'data\edgar_documents\AMD\4_2023-04-14' --> 'data\processed_data\AMD\4_2023-04-14.md'


2025-11-14 15:32:24,440 - INFO - Processing document 4_2023-04-18
2025-11-14 15:32:24,489 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:32:24,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,574 - INFO - Going to convert document batch...
2025-11-14 15:32:24,576 - INFO - Processing document 4_2023-05-09
2025-11-14 15:32:24,644 - INFO - Finished converting document 4_2023-05-09 in 0.11 sec.
2025-11-14 15:32:24,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-04-18' --> 'data\processed_data\AMD\4_2023-04-18.md'
Converted 'data\edgar_documents\AMD\4_2023-05-09' --> 'data\processed_data\AMD\4_2023-05-09.md'


2025-11-14 15:32:24,745 - INFO - Going to convert document batch...
2025-11-14 15:32:24,747 - INFO - Processing document 4_2023-05-17
2025-11-14 15:32:24,792 - INFO - Finished converting document 4_2023-05-17 in 0.09 sec.
2025-11-14 15:32:24,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,882 - INFO - Going to convert document batch...
2025-11-14 15:32:24,883 - INFO - Processing document 4_2023-05-22
2025-11-14 15:32:24,927 - INFO - Finished converting document 4_2023-05-22 in 0.08 sec.
2025-11-14 15:32:24,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,012 - INFO - Going to convert document batch...
2025-11-14 15:32:25,013 - INFO - Processing document 4_2023-05-25


Converted 'data\edgar_documents\AMD\4_2023-05-17' --> 'data\processed_data\AMD\4_2023-05-17.md'
Converted 'data\edgar_documents\AMD\4_2023-05-22' --> 'data\processed_data\AMD\4_2023-05-22.md'


2025-11-14 15:32:25,068 - INFO - Finished converting document 4_2023-05-25 in 0.09 sec.
2025-11-14 15:32:25,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,161 - INFO - Going to convert document batch...
2025-11-14 15:32:25,162 - INFO - Processing document 4_2023-05-30
2025-11-14 15:32:25,198 - INFO - Finished converting document 4_2023-05-30 in 0.08 sec.
2025-11-14 15:32:25,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,286 - INFO - Going to convert document batch...
2025-11-14 15:32:25,288 - INFO - Processing document 4_2023-06-07


Converted 'data\edgar_documents\AMD\4_2023-05-25' --> 'data\processed_data\AMD\4_2023-05-25.md'
Converted 'data\edgar_documents\AMD\4_2023-05-30' --> 'data\processed_data\AMD\4_2023-05-30.md'


2025-11-14 15:32:25,350 - INFO - Finished converting document 4_2023-06-07 in 0.09 sec.
2025-11-14 15:32:25,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,497 - INFO - Going to convert document batch...
2025-11-14 15:32:25,498 - INFO - Processing document 4_2023-06-08
2025-11-14 15:32:25,610 - INFO - Finished converting document 4_2023-06-08 in 0.19 sec.


Converted 'data\edgar_documents\AMD\4_2023-06-07' --> 'data\processed_data\AMD\4_2023-06-07.md'


2025-11-14 15:32:25,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,732 - INFO - Going to convert document batch...
2025-11-14 15:32:25,733 - INFO - Processing document 4_2023-06-12
2025-11-14 15:32:25,777 - INFO - Finished converting document 4_2023-06-12 in 0.09 sec.
2025-11-14 15:32:25,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-06-08' --> 'data\processed_data\AMD\4_2023-06-08.md'
Converted 'data\edgar_documents\AMD\4_2023-06-12' --> 'data\processed_data\AMD\4_2023-06-12.md'


2025-11-14 15:32:25,886 - INFO - Going to convert document batch...
2025-11-14 15:32:25,888 - INFO - Processing document 4_2023-06-13
2025-11-14 15:32:25,984 - INFO - Finished converting document 4_2023-06-13 in 0.16 sec.
2025-11-14 15:32:26,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,158 - INFO - Going to convert document batch...
2025-11-14 15:32:26,160 - INFO - Processing document 4_2023-07-10
2025-11-14 15:32:26,242 - INFO - Finished converting document 4_2023-07-10 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2023-06-13' --> 'data\processed_data\AMD\4_2023-06-13.md'


2025-11-14 15:32:26,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,411 - INFO - Going to convert document batch...
2025-11-14 15:32:26,413 - INFO - Processing document 4_2023-07-14
2025-11-14 15:32:26,493 - INFO - Finished converting document 4_2023-07-14 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-07-10' --> 'data\processed_data\AMD\4_2023-07-10.md'


2025-11-14 15:32:26,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,661 - INFO - Going to convert document batch...
2025-11-14 15:32:26,662 - INFO - Processing document 4_2023-08-10
2025-11-14 15:32:26,731 - INFO - Finished converting document 4_2023-08-10 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-07-14' --> 'data\processed_data\AMD\4_2023-07-14.md'


2025-11-14 15:32:26,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,857 - INFO - Going to convert document batch...
2025-11-14 15:32:26,858 - INFO - Processing document 4_2023-08-11
2025-11-14 15:32:26,930 - INFO - Finished converting document 4_2023-08-11 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2023-08-10' --> 'data\processed_data\AMD\4_2023-08-10.md'


2025-11-14 15:32:27,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,048 - INFO - Going to convert document batch...
2025-11-14 15:32:27,049 - INFO - Processing document 4_2023-08-17
2025-11-14 15:32:27,117 - INFO - Finished converting document 4_2023-08-17 in 0.11 sec.
2025-11-14 15:32:27,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-08-11' --> 'data\processed_data\AMD\4_2023-08-11.md'
Converted 'data\edgar_documents\AMD\4_2023-08-17' --> 'data\processed_data\AMD\4_2023-08-17.md'


2025-11-14 15:32:27,214 - INFO - Going to convert document batch...
2025-11-14 15:32:27,216 - INFO - Processing document 4_2023-08-18
2025-11-14 15:32:27,260 - INFO - Finished converting document 4_2023-08-18 in 0.09 sec.
2025-11-14 15:32:27,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,327 - INFO - Going to convert document batch...
2025-11-14 15:32:27,328 - INFO - Processing document 4_2023-08-29
2025-11-14 15:32:27,371 - INFO - Finished converting document 4_2023-08-29 in 0.08 sec.
2025-11-14 15:32:27,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,446 - INFO - Going to convert document batch...
2025-11-14 15:32:27,447 - INFO - Processing document 4_2023-08-30
2025-11-14 15:32:27,507 - INFO - Finished converting document 4_2023-08-30 in 0.09 sec.


Converted 'data\edgar_documents\AMD\4_2023-08-18' --> 'data\processed_data\AMD\4_2023-08-18.md'
Converted 'data\edgar_documents\AMD\4_2023-08-29' --> 'data\processed_data\AMD\4_2023-08-29.md'


2025-11-14 15:32:27,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,630 - INFO - Going to convert document batch...
2025-11-14 15:32:27,631 - INFO - Processing document 4_2023-09-01
2025-11-14 15:32:27,670 - INFO - Finished converting document 4_2023-09-01 in 0.11 sec.
2025-11-14 15:32:27,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-08-30' --> 'data\processed_data\AMD\4_2023-08-30.md'
Converted 'data\edgar_documents\AMD\4_2023-09-01' --> 'data\processed_data\AMD\4_2023-09-01.md'


2025-11-14 15:32:27,784 - INFO - Going to convert document batch...
2025-11-14 15:32:27,786 - INFO - Processing document 4_2023-09-14
2025-11-14 15:32:27,872 - INFO - Finished converting document 4_2023-09-14 in 0.17 sec.
2025-11-14 15:32:27,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,950 - INFO - Going to convert document batch...
2025-11-14 15:32:27,951 - INFO - Processing document 4_2023-11-07
2025-11-14 15:32:27,992 - INFO - Finished converting document 4_2023-11-07 in 0.08 sec.
2025-11-14 15:32:28,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,111 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2023-09-14' --> 'data\processed_data\AMD\4_2023-09-14.md'
Converted 'data\edgar_documents\AMD\4_2023-11-07' --> 'data\processed_data\AMD\4_2023-11-07.md'


2025-11-14 15:32:28,112 - INFO - Processing document 4_2023-11-09
2025-11-14 15:32:28,183 - INFO - Finished converting document 4_2023-11-09 in 0.14 sec.
2025-11-14 15:32:28,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,275 - INFO - Going to convert document batch...
2025-11-14 15:32:28,276 - INFO - Processing document 4_2023-11-29
2025-11-14 15:32:28,349 - INFO - Finished converting document 4_2023-11-29 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2023-11-09' --> 'data\processed_data\AMD\4_2023-11-09.md'


2025-11-14 15:32:28,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,479 - INFO - Going to convert document batch...
2025-11-14 15:32:28,482 - INFO - Processing document 4_2023-12-07
2025-11-14 15:32:28,546 - INFO - Finished converting document 4_2023-12-07 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2023-11-29' --> 'data\processed_data\AMD\4_2023-11-29.md'
Converted 'data\edgar_documents\AMD\4_2023-12-07' --> 'data\processed_data\AMD\4_2023-12-07.md'


2025-11-14 15:32:28,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,669 - INFO - Going to convert document batch...
2025-11-14 15:32:28,670 - INFO - Processing document 4_2023-12-11
2025-11-14 15:32:28,708 - INFO - Finished converting document 4_2023-12-11 in 0.08 sec.
2025-11-14 15:32:28,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,792 - INFO - Going to convert document batch...
2025-11-14 15:32:28,793 - INFO - Processing document 4_2024-01-17


Converted 'data\edgar_documents\AMD\4_2023-12-11' --> 'data\processed_data\AMD\4_2023-12-11.md'


2025-11-14 15:32:29,552 - INFO - Finished converting document 4_2024-01-17 in 0.80 sec.
2025-11-14 15:32:29,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:29,664 - INFO - Going to convert document batch...
2025-11-14 15:32:29,667 - INFO - Processing document 4_2024-02-06
2025-11-14 15:32:29,710 - INFO - Finished converting document 4_2024-02-06 in 0.08 sec.
2025-11-14 15:32:29,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-01-17' --> 'data\processed_data\AMD\4_2024-01-17.md'
Converted 'data\edgar_documents\AMD\4_2024-02-06' --> 'data\processed_data\AMD\4_2024-02-06.md'


2025-11-14 15:32:29,809 - INFO - Going to convert document batch...
2025-11-14 15:32:29,810 - INFO - Processing document 4_2024-02-07
2025-11-14 15:32:29,876 - INFO - Finished converting document 4_2024-02-07 in 0.12 sec.
2025-11-14 15:32:29,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,020 - INFO - Going to convert document batch...
2025-11-14 15:32:30,021 - INFO - Processing document 4_2024-02-16
2025-11-14 15:32:30,110 - INFO - Finished converting document 4_2024-02-16 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2024-02-07' --> 'data\processed_data\AMD\4_2024-02-07.md'
Converted 'data\edgar_documents\AMD\4_2024-02-16' --> 'data\processed_data\AMD\4_2024-02-16.md'


2025-11-14 15:32:30,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,195 - INFO - Going to convert document batch...
2025-11-14 15:32:30,197 - INFO - Processing document 4_2024-02-20
2025-11-14 15:32:30,232 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 15:32:30,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,310 - INFO - Going to convert document batch...
2025-11-14 15:32:30,312 - INFO - Processing document 4_2024-02-23
2025-11-14 15:32:30,386 - INFO - Finished converting document 4_2024-02-23 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-02-20' --> 'data\processed_data\AMD\4_2024-02-20.md'


2025-11-14 15:32:30,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,562 - INFO - Going to convert document batch...
2025-11-14 15:32:30,563 - INFO - Processing document 4_2024-03-04
2025-11-14 15:32:30,615 - INFO - Finished converting document 4_2024-03-04 in 0.09 sec.
2025-11-14 15:32:30,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-02-23' --> 'data\processed_data\AMD\4_2024-02-23.md'
Converted 'data\edgar_documents\AMD\4_2024-03-04' --> 'data\processed_data\AMD\4_2024-03-04.md'


2025-11-14 15:32:30,724 - INFO - Going to convert document batch...
2025-11-14 15:32:30,727 - INFO - Processing document 4_2024-03-06
2025-11-14 15:32:30,789 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 15:32:30,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,892 - INFO - Going to convert document batch...
2025-11-14 15:32:30,893 - INFO - Processing document 4_2024-03-07
2025-11-14 15:32:30,972 - INFO - Finished converting document 4_2024-03-07 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-06' --> 'data\processed_data\AMD\4_2024-03-06.md'


2025-11-14 15:32:31,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,118 - INFO - Going to convert document batch...
2025-11-14 15:32:31,120 - INFO - Processing document 4_2024-03-11
2025-11-14 15:32:31,191 - INFO - Finished converting document 4_2024-03-11 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-07' --> 'data\processed_data\AMD\4_2024-03-07.md'


2025-11-14 15:32:31,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,281 - INFO - Going to convert document batch...
2025-11-14 15:32:31,282 - INFO - Processing document 4_2024-03-15
2025-11-14 15:32:31,352 - INFO - Finished converting document 4_2024-03-15 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-11' --> 'data\processed_data\AMD\4_2024-03-11.md'


2025-11-14 15:32:31,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,466 - INFO - Going to convert document batch...
2025-11-14 15:32:31,468 - INFO - Processing document 4_2024-03-19
2025-11-14 15:32:31,532 - INFO - Finished converting document 4_2024-03-19 in 0.11 sec.
2025-11-14 15:32:31,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-03-15' --> 'data\processed_data\AMD\4_2024-03-15.md'
Converted 'data\edgar_documents\AMD\4_2024-03-19' --> 'data\processed_data\AMD\4_2024-03-19.md'


2025-11-14 15:32:31,635 - INFO - Going to convert document batch...
2025-11-14 15:32:31,636 - INFO - Processing document 4_2024-04-17
2025-11-14 15:32:31,713 - INFO - Finished converting document 4_2024-04-17 in 0.14 sec.
2025-11-14 15:32:31,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,820 - INFO - Going to convert document batch...
2025-11-14 15:32:31,821 - INFO - Processing document 4_2024-05-10
2025-11-14 15:32:31,877 - INFO - Finished converting document 4_2024-05-10 in 0.09 sec.
2025-11-14 15:32:31,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,965 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-04-17' --> 'data\processed_data\AMD\4_2024-04-17.md'
Converted 'data\edgar_documents\AMD\4_2024-05-10' --> 'data\processed_data\AMD\4_2024-05-10.md'


2025-11-14 15:32:31,967 - INFO - Processing document 4_2024-05-17
2025-11-14 15:32:32,017 - INFO - Finished converting document 4_2024-05-17 in 0.09 sec.
2025-11-14 15:32:32,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,127 - INFO - Going to convert document batch...
2025-11-14 15:32:32,128 - INFO - Processing document 4_2024-05-21
2025-11-14 15:32:32,182 - INFO - Finished converting document 4_2024-05-21 in 0.12 sec.
2025-11-14 15:32:32,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-05-17' --> 'data\processed_data\AMD\4_2024-05-17.md'
Converted 'data\edgar_documents\AMD\4_2024-05-21' --> 'data\processed_data\AMD\4_2024-05-21.md'


2025-11-14 15:32:32,265 - INFO - Going to convert document batch...
2025-11-14 15:32:32,266 - INFO - Processing document 4_2024-06-06
2025-11-14 15:32:32,311 - INFO - Finished converting document 4_2024-06-06 in 0.09 sec.
2025-11-14 15:32:32,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,394 - INFO - Going to convert document batch...
2025-11-14 15:32:32,395 - INFO - Processing document 4_2024-06-07
2025-11-14 15:32:32,462 - INFO - Finished converting document 4_2024-06-07 in 0.11 sec.
2025-11-14 15:32:32,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-06' --> 'data\processed_data\AMD\4_2024-06-06.md'
Converted 'data\edgar_documents\AMD\4_2024-06-07' --> 'data\processed_data\AMD\4_2024-06-07.md'


2025-11-14 15:32:32,552 - INFO - Going to convert document batch...
2025-11-14 15:32:32,553 - INFO - Processing document 4_2024-06-10
2025-11-14 15:32:32,603 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.
2025-11-14 15:32:32,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,706 - INFO - Going to convert document batch...
2025-11-14 15:32:32,708 - INFO - Processing document 4_2024-06-11
2025-11-14 15:32:32,771 - INFO - Finished converting document 4_2024-06-11 in 0.11 sec.
2025-11-14 15:32:32,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-10' --> 'data\processed_data\AMD\4_2024-06-10.md'
Converted 'data\edgar_documents\AMD\4_2024-06-11' --> 'data\processed_data\AMD\4_2024-06-11.md'


2025-11-14 15:32:32,882 - INFO - Going to convert document batch...
2025-11-14 15:32:32,884 - INFO - Processing document 4_2024-06-12
2025-11-14 15:32:32,935 - INFO - Finished converting document 4_2024-06-12 in 0.11 sec.
2025-11-14 15:32:32,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,020 - INFO - Going to convert document batch...
2025-11-14 15:32:33,021 - INFO - Processing document 4_2024-06-13
2025-11-14 15:32:33,083 - INFO - Finished converting document 4_2024-06-13 in 0.09 sec.
2025-11-14 15:32:33,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,195 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-06-12' --> 'data\processed_data\AMD\4_2024-06-12.md'
Converted 'data\edgar_documents\AMD\4_2024-06-13' --> 'data\processed_data\AMD\4_2024-06-13.md'


2025-11-14 15:32:33,197 - INFO - Processing document 4_2024-06-18
2025-11-14 15:32:33,283 - INFO - Finished converting document 4_2024-06-18 in 0.12 sec.
2025-11-14 15:32:33,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,389 - INFO - Going to convert document batch...
2025-11-14 15:32:33,390 - INFO - Processing document 4_2024-07-16
2025-11-14 15:32:33,452 - INFO - Finished converting document 4_2024-07-16 in 0.11 sec.
2025-11-14 15:32:33,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-18' --> 'data\processed_data\AMD\4_2024-06-18.md'
Converted 'data\edgar_documents\AMD\4_2024-07-16' --> 'data\processed_data\AMD\4_2024-07-16.md'


2025-11-14 15:32:33,584 - INFO - Going to convert document batch...
2025-11-14 15:32:33,587 - INFO - Processing document 4_2024-07-17
2025-11-14 15:32:33,696 - INFO - Finished converting document 4_2024-07-17 in 0.17 sec.
2025-11-14 15:32:33,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,774 - INFO - Going to convert document batch...
2025-11-14 15:32:33,775 - INFO - Processing document 4_2024-08-07
2025-11-14 15:32:33,810 - INFO - Finished converting document 4_2024-08-07 in 0.08 sec.
2025-11-14 15:32:33,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-07-17' --> 'data\processed_data\AMD\4_2024-07-17.md'
Converted 'data\edgar_documents\AMD\4_2024-08-07' --> 'data\processed_data\AMD\4_2024-08-07.md'


2025-11-14 15:32:33,926 - INFO - Going to convert document batch...
2025-11-14 15:32:33,929 - INFO - Processing document 4_2024-08-13
2025-11-14 15:32:34,028 - INFO - Finished converting document 4_2024-08-13 in 0.16 sec.
2025-11-14 15:32:34,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,182 - INFO - Going to convert document batch...
2025-11-14 15:32:34,184 - INFO - Processing document 4_2024-08-19
2025-11-14 15:32:34,246 - INFO - Finished converting document 4_2024-08-19 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-13' --> 'data\processed_data\AMD\4_2024-08-13.md'


2025-11-14 15:32:34,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,345 - INFO - Going to convert document batch...
2025-11-14 15:32:34,347 - INFO - Processing document 4_2024-08-22
2025-11-14 15:32:34,423 - INFO - Finished converting document 4_2024-08-22 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-19' --> 'data\processed_data\AMD\4_2024-08-19.md'


2025-11-14 15:32:34,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,530 - INFO - Going to convert document batch...
2025-11-14 15:32:34,531 - INFO - Processing document 4_2024-09-13
2025-11-14 15:32:34,602 - INFO - Finished converting document 4_2024-09-13 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-22' --> 'data\processed_data\AMD\4_2024-08-22.md'


2025-11-14 15:32:34,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,746 - INFO - Going to convert document batch...
2025-11-14 15:32:34,747 - INFO - Processing document 4_2024-09-17
2025-11-14 15:32:34,817 - INFO - Finished converting document 4_2024-09-17 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-09-13' --> 'data\processed_data\AMD\4_2024-09-13.md'
Converted 'data\edgar_documents\AMD\4_2024-09-17' --> 'data\processed_data\AMD\4_2024-09-17.md'


2025-11-14 15:32:34,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,921 - INFO - Going to convert document batch...
2025-11-14 15:32:34,923 - INFO - Processing document 4_2024-11-05
2025-11-14 15:32:34,989 - INFO - Finished converting document 4_2024-11-05 in 0.12 sec.
2025-11-14 15:32:35,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,088 - INFO - Going to convert document batch...
2025-11-14 15:32:35,090 - INFO - Processing document 4_2024-11-07
2025-11-14 15:32:35,150 - INFO - Finished converting document 4_2024-11-07 in 0.09 sec.
2025-11-14 15:32:35,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,243 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-11-05' --> 'data\processed_data\AMD\4_2024-11-05.md'
Converted 'data\edgar_documents\AMD\4_2024-11-07' --> 'data\processed_data\AMD\4_2024-11-07.md'


2025-11-14 15:32:35,245 - INFO - Processing document 4_2024-11-08
2025-11-14 15:32:35,308 - INFO - Finished converting document 4_2024-11-08 in 0.12 sec.
2025-11-14 15:32:35,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,410 - INFO - Going to convert document batch...
2025-11-14 15:32:35,412 - INFO - Processing document 4_2024-12-06
2025-11-14 15:32:35,478 - INFO - Finished converting document 4_2024-12-06 in 0.09 sec.
2025-11-14 15:32:35,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-11-08' --> 'data\processed_data\AMD\4_2024-11-08.md'
Converted 'data\edgar_documents\AMD\4_2024-12-06' --> 'data\processed_data\AMD\4_2024-12-06.md'


2025-11-14 15:32:35,593 - INFO - Going to convert document batch...
2025-11-14 15:32:35,598 - INFO - Processing document 4_2024-12-17
2025-11-14 15:32:35,706 - INFO - Finished converting document 4_2024-12-17 in 0.16 sec.
2025-11-14 15:32:35,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,804 - INFO - Going to convert document batch...
2025-11-14 15:32:35,805 - INFO - Processing document 4_2025-01-17
2025-11-14 15:32:35,874 - INFO - Finished converting document 4_2025-01-17 in 0.11 sec.
2025-11-14 15:32:35,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-12-17' --> 'data\processed_data\AMD\4_2024-12-17.md'
Converted 'data\edgar_documents\AMD\4_2025-01-17' --> 'data\processed_data\AMD\4_2025-01-17.md'


2025-11-14 15:32:35,998 - INFO - Going to convert document batch...
2025-11-14 15:32:35,999 - INFO - Processing document 4_2025-02-12
2025-11-14 15:32:36,066 - INFO - Finished converting document 4_2025-02-12 in 0.12 sec.
2025-11-14 15:32:36,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,176 - INFO - Going to convert document batch...
2025-11-14 15:32:36,178 - INFO - Processing document 4_2025-02-19
2025-11-14 15:32:36,237 - INFO - Finished converting document 4_2025-02-19 in 0.09 sec.
2025-11-14 15:32:36,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2025-02-12' --> 'data\processed_data\AMD\4_2025-02-12.md'
Converted 'data\edgar_documents\AMD\4_2025-02-19' --> 'data\processed_data\AMD\4_2025-02-19.md'


2025-11-14 15:32:36,328 - INFO - Processing document 4_2025-03-03
2025-11-14 15:32:36,393 - INFO - Finished converting document 4_2025-03-03 in 0.11 sec.
2025-11-14 15:32:36,488 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:32:36,489 - ERROR - Input document 4_2025-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:32:36,494 - INFO - Going to convert document batch...
2025-11-14 15:32:36,528 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\AMD\4_2025-03-03' --> 'data\processed_data\AMD\4_2025-03-03.md'
Error processing data\edgar_documents\AMD\4_2025-03-10: File format not allowed: data\edgar_documents\AMD\4_2025-03-10
Error processing data\edgar_documents\AMD\4_2025-03-12: File format not allowed: data\edgar_documents\AMD\4_2025-03-12


2025-11-14 15:32:36,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,772 - INFO - Going to convert document batch...
2025-11-14 15:32:36,773 - INFO - Processing document 4_2025-03-18
2025-11-14 15:32:36,838 - INFO - Finished converting document 4_2025-03-18 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2025-03-14' --> 'data\processed_data\AMD\4_2025-03-14.md'


2025-11-14 15:32:36,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,971 - INFO - Going to convert document batch...
2025-11-14 15:32:36,973 - INFO - Processing document 4_2025-04-17
2025-11-14 15:32:37,050 - INFO - Finished converting document 4_2025-04-17 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2025-03-18' --> 'data\processed_data\AMD\4_2025-03-18.md'


2025-11-14 15:32:37,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,164 - INFO - Going to convert document batch...
2025-11-14 15:32:37,165 - INFO - Processing document 4_2025-05-12
2025-11-14 15:32:37,249 - INFO - Finished converting document 4_2025-05-12 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2025-04-17' --> 'data\processed_data\AMD\4_2025-04-17.md'
Converted 'data\edgar_documents\AMD\4_2025-05-12' --> 'data\processed_data\AMD\4_2025-05-12.md'


2025-11-14 15:32:37,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,378 - INFO - Going to convert document batch...
2025-11-14 15:32:37,380 - INFO - Processing document 4_2025-05-16
2025-11-14 15:32:37,451 - INFO - Finished converting document 4_2025-05-16 in 0.14 sec.
2025-11-14 15:32:37,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,563 - INFO - Going to convert document batch...
2025-11-14 15:32:37,565 - INFO - Processing document 4_2025-05-19
2025-11-14 15:32:37,635 - INFO - Finished converting document 4_2025-05-19 in 0.11 sec.
2025-11-14 15:32:37,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-05-16' --> 'data\processed_data\AMD\4_2025-05-16.md'
Converted 'data\edgar_documents\AMD\4_2025-05-19' --> 'data\processed_data\AMD\4_2025-05-19.md'


2025-11-14 15:32:37,731 - INFO - Going to convert document batch...
2025-11-14 15:32:37,732 - INFO - Processing document 4_2025-05-22
2025-11-14 15:32:37,786 - INFO - Finished converting document 4_2025-05-22 in 0.09 sec.
2025-11-14 15:32:37,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,880 - INFO - Going to convert document batch...
2025-11-14 15:32:37,882 - INFO - Processing document 4_2025-06-13
2025-11-14 15:32:37,952 - INFO - Finished converting document 4_2025-06-13 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2025-05-22' --> 'data\processed_data\AMD\4_2025-05-22.md'
Converted 'data\edgar_documents\AMD\4_2025-06-13' --> 'data\processed_data\AMD\4_2025-06-13.md'


2025-11-14 15:32:38,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:38,125 - INFO - Going to convert document batch...
2025-11-14 15:32:38,128 - INFO - Processing document 4_2025-06-17
2025-11-14 15:32:38,202 - INFO - Finished converting document 4_2025-06-17 in 0.19 sec.
2025-11-14 15:32:38,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-06-17' --> 'data\processed_data\AMD\4_2025-06-17.md'


2025-11-14 15:32:38,756 - INFO - Going to convert document batch...
2025-11-14 15:32:38,757 - INFO - Processing document 4_2025-07-17
2025-11-14 15:32:38,837 - INFO - Finished converting document 4_2025-07-17 in 0.58 sec.
2025-11-14 15:32:38,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:38,958 - INFO - Going to convert document batch...
2025-11-14 15:32:38,960 - INFO - Processing document 4_2025-08-12
2025-11-14 15:32:39,039 - INFO - Finished converting document 4_2025-08-12 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2025-07-17' --> 'data\processed_data\AMD\4_2025-07-17.md'
Converted 'data\edgar_documents\AMD\4_2025-08-12' --> 'data\processed_data\AMD\4_2025-08-12.md'


2025-11-14 15:32:39,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,182 - INFO - Going to convert document batch...
2025-11-14 15:32:39,184 - INFO - Processing document 4_2025-08-15
2025-11-14 15:32:39,263 - INFO - Finished converting document 4_2025-08-15 in 0.16 sec.
2025-11-14 15:32:39,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,376 - INFO - Going to convert document batch...
2025-11-14 15:32:39,377 - INFO - Processing document 4_2025-08-19
2025-11-14 15:32:39,438 - INFO - Finished converting document 4_2025-08-19 in 0.11 sec.
2025-11-14 15:32:39,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-08-15' --> 'data\processed_data\AMD\4_2025-08-15.md'
Converted 'data\edgar_documents\AMD\4_2025-08-19' --> 'data\processed_data\AMD\4_2025-08-19.md'


2025-11-14 15:32:39,562 - INFO - Going to convert document batch...
2025-11-14 15:32:39,564 - INFO - Processing document 4_2025-08-25
2025-11-14 15:32:39,644 - INFO - Finished converting document 4_2025-08-25 in 0.14 sec.
2025-11-14 15:32:39,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,729 - INFO - Going to convert document batch...
2025-11-14 15:32:39,730 - INFO - Processing document 4_2025-09-04
2025-11-14 15:32:39,771 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 15:32:39,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,878 - INFO - Going to convert document batch...
2025-11-14 15:32:39,880 - INFO - Processing document 4_2025-09-12


Converted 'data\edgar_documents\AMD\4_2025-08-25' --> 'data\processed_data\AMD\4_2025-08-25.md'
Converted 'data\edgar_documents\AMD\4_2025-09-04' --> 'data\processed_data\AMD\4_2025-09-04.md'


2025-11-14 15:32:39,960 - INFO - Finished converting document 4_2025-09-12 in 0.14 sec.
2025-11-14 15:32:40,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,076 - INFO - Going to convert document batch...
2025-11-14 15:32:40,079 - INFO - Processing document 4_2025-09-17
2025-11-14 15:32:40,175 - INFO - Finished converting document 4_2025-09-17 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2025-09-12' --> 'data\processed_data\AMD\4_2025-09-12.md'


2025-11-14 15:32:40,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,293 - INFO - Going to convert document batch...
2025-11-14 15:32:40,294 - INFO - Processing document 4_2025-09-26
2025-11-14 15:32:40,348 - INFO - Finished converting document 4_2025-09-26 in 0.11 sec.
2025-11-14 15:32:40,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-09-17' --> 'data\processed_data\AMD\4_2025-09-17.md'
Converted 'data\edgar_documents\AMD\4_2025-09-26' --> 'data\processed_data\AMD\4_2025-09-26.md'


2025-11-14 15:32:40,442 - INFO - Going to convert document batch...
2025-11-14 15:32:40,444 - INFO - Processing document 4_2025-10-08
2025-11-14 15:32:40,515 - INFO - Finished converting document 4_2025-10-08 in 0.11 sec.
2025-11-14 15:32:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,631 - INFO - Going to convert document batch...
2025-11-14 15:32:40,633 - INFO - Processing document 4_2025-10-17
2025-11-14 15:32:40,691 - INFO - Finished converting document 4_2025-10-17 in 0.11 sec.
2025-11-14 15:32:40,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-10-08' --> 'data\processed_data\AMD\4_2025-10-08.md'
Converted 'data\edgar_documents\AMD\4_2025-10-17' --> 'data\processed_data\AMD\4_2025-10-17.md'


2025-11-14 15:32:40,828 - INFO - Going to convert document batch...
2025-11-14 15:32:40,831 - INFO - Processing document 8-K_2023-01-11
2025-11-14 15:32:40,906 - INFO - Finished converting document 8-K_2023-01-11 in 0.16 sec.
2025-11-14 15:32:40,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,027 - INFO - Going to convert document batch...
2025-11-14 15:32:41,030 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:32:41,086 - INFO - Finished converting document 8-K_2023-01-31 in 0.12 sec.


Converted 'data\edgar_documents\AMD\8-K_2023-01-11' --> 'data\processed_data\AMD\8-K_2023-01-11.md'
Converted 'data\edgar_documents\AMD\8-K_2023-01-31' --> 'data\processed_data\AMD\8-K_2023-01-31.md'


2025-11-14 15:32:41,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,220 - INFO - Going to convert document batch...
2025-11-14 15:32:41,222 - INFO - Processing document 8-K_2023-02-21
2025-11-14 15:32:41,272 - INFO - Finished converting document 8-K_2023-02-21 in 0.12 sec.
2025-11-14 15:32:41,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,348 - INFO - Going to convert document batch...
2025-11-14 15:32:41,349 - INFO - Processing document 8-K_2023-05-02
2025-11-14 15:32:41,377 - INFO - Finished converting document 8-K_2023-05-02 in 0.08 sec.
2025-11-14 15:32:41,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,453 - INFO - Going to convert document batch...
2025-11-14 15:32:41,455 - INFO - Processing document 8-K_2023-05-23


Converted 'data\edgar_documents\AMD\8-K_2023-02-21' --> 'data\processed_data\AMD\8-K_2023-02-21.md'
Converted 'data\edgar_documents\AMD\8-K_2023-05-02' --> 'data\processed_data\AMD\8-K_2023-05-02.md'


2025-11-14 15:32:41,536 - INFO - Finished converting document 8-K_2023-05-23 in 0.14 sec.
2025-11-14 15:32:41,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,650 - INFO - Going to convert document batch...
2025-11-14 15:32:41,651 - INFO - Processing document 8-K_2023-07-10
2025-11-14 15:32:41,699 - INFO - Finished converting document 8-K_2023-07-10 in 0.12 sec.


Converted 'data\edgar_documents\AMD\8-K_2023-05-23' --> 'data\processed_data\AMD\8-K_2023-05-23.md'
Converted 'data\edgar_documents\AMD\8-K_2023-07-10' --> 'data\processed_data\AMD\8-K_2023-07-10.md'


2025-11-14 15:32:41,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,826 - INFO - Going to convert document batch...
2025-11-14 15:32:41,828 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:32:41,879 - INFO - Finished converting document 8-K_2023-08-01 in 0.12 sec.
2025-11-14 15:32:41,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,976 - INFO - Going to convert document batch...
2025-11-14 15:32:41,980 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:32:42,034 - INFO - Finished converting document 8-K_2023-10-31 in 0.12 sec.
2025-11-14 15:32:42,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2023-08-01' --> 'data\processed_data\AMD\8-K_2023-08-01.md'
Converted 'data\edgar_documents\AMD\8-K_2023-10-31' --> 'data\processed_data\AMD\8-K_2023-10-31.md'


2025-11-14 15:32:42,124 - INFO - Going to convert document batch...
2025-11-14 15:32:42,130 - INFO - Processing document 8-K_2024-01-30
2025-11-14 15:32:42,207 - INFO - Finished converting document 8-K_2024-01-30 in 0.14 sec.
2025-11-14 15:32:42,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,294 - INFO - Going to convert document batch...
2025-11-14 15:32:42,296 - INFO - Processing document 8-K_2024-02-20
2025-11-14 15:32:42,379 - INFO - Finished converting document 8-K_2024-02-20 in 0.14 sec.
2025-11-14 15:32:42,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2024-01-30' --> 'data\processed_data\AMD\8-K_2024-01-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-02-20' --> 'data\processed_data\AMD\8-K_2024-02-20.md'


2025-11-14 15:32:42,484 - INFO - Going to convert document batch...
2025-11-14 15:32:42,490 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:32:42,546 - INFO - Finished converting document 8-K_2024-04-30 in 0.14 sec.
2025-11-14 15:32:42,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,659 - INFO - Going to convert document batch...
2025-11-14 15:32:42,661 - INFO - Processing document 8-K_2024-05-13
2025-11-14 15:32:42,737 - INFO - Finished converting document 8-K_2024-05-13 in 0.16 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-04-30' --> 'data\processed_data\AMD\8-K_2024-04-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-05-13' --> 'data\processed_data\AMD\8-K_2024-05-13.md'


2025-11-14 15:32:42,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,866 - INFO - Going to convert document batch...
2025-11-14 15:32:42,867 - INFO - Processing document 8-K_2024-07-02
2025-11-14 15:32:42,929 - INFO - Finished converting document 8-K_2024-07-02 in 0.14 sec.
2025-11-14 15:32:42,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,010 - INFO - Going to convert document batch...
2025-11-14 15:32:43,012 - INFO - Processing document 8-K_2024-07-22
2025-11-14 15:32:43,059 - INFO - Finished converting document 8-K_2024-07-22 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-07-02' --> 'data\processed_data\AMD\8-K_2024-07-02.md'
Converted 'data\edgar_documents\AMD\8-K_2024-07-22' --> 'data\processed_data\AMD\8-K_2024-07-22.md'


2025-11-14 15:32:43,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,172 - INFO - Going to convert document batch...
2025-11-14 15:32:43,175 - INFO - Processing document 8-K_2024-07-30
2025-11-14 15:32:43,234 - INFO - Finished converting document 8-K_2024-07-30 in 0.14 sec.
2025-11-14 15:32:43,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,330 - INFO - Going to convert document batch...
2025-11-14 15:32:43,332 - INFO - Processing document 8-K_2024-08-19
2025-11-14 15:32:43,396 - INFO - Finished converting document 8-K_2024-08-19 in 0.12 sec.
2025-11-14 15:32:43,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2024-07-30' --> 'data\processed_data\AMD\8-K_2024-07-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-08-19' --> 'data\processed_data\AMD\8-K_2024-08-19.md'


2025-11-14 15:32:43,474 - INFO - Going to convert document batch...
2025-11-14 15:32:43,475 - INFO - Processing document 8-K_2024-10-29
2025-11-14 15:32:43,547 - INFO - Finished converting document 8-K_2024-10-29 in 0.11 sec.
2025-11-14 15:32:43,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,630 - INFO - Going to convert document batch...
2025-11-14 15:32:43,633 - INFO - Processing document 8-K_2024-11-18
2025-11-14 15:32:43,685 - INFO - Finished converting document 8-K_2024-11-18 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-10-29' --> 'data\processed_data\AMD\8-K_2024-10-29.md'
Converted 'data\edgar_documents\AMD\8-K_2024-11-18' --> 'data\processed_data\AMD\8-K_2024-11-18.md'


2025-11-14 15:32:43,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,808 - INFO - Going to convert document batch...
2025-11-14 15:32:43,810 - INFO - Processing document 8-K_2025-02-04
2025-11-14 15:32:43,866 - INFO - Finished converting document 8-K_2025-02-04 in 0.12 sec.
2025-11-14 15:32:43,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,971 - INFO - Going to convert document batch...
2025-11-14 15:32:43,973 - INFO - Processing document 8-K_2025-02-24
2025-11-14 15:32:44,031 - INFO - Finished converting document 8-K_2025-02-24 in 0.14 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-02-04' --> 'data\processed_data\AMD\8-K_2025-02-04.md'
Converted 'data\edgar_documents\AMD\8-K_2025-02-24' --> 'data\processed_data\AMD\8-K_2025-02-24.md'


2025-11-14 15:32:44,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,129 - INFO - Going to convert document batch...
2025-11-14 15:32:44,130 - INFO - Processing document 8-K_2025-03-12
2025-11-14 15:32:44,177 - INFO - Finished converting document 8-K_2025-03-12 in 0.12 sec.
2025-11-14 15:32:44,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,263 - INFO - Going to convert document batch...
2025-11-14 15:32:44,265 - INFO - Processing document 8-K_2025-03-24
2025-11-14 15:32:44,322 - INFO - Finished converting document 8-K_2025-03-24 in 0.11 sec.
2025-11-14 15:32:44,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-03-12' --> 'data\processed_data\AMD\8-K_2025-03-12.md'
Converted 'data\edgar_documents\AMD\8-K_2025-03-24' --> 'data\processed_data\AMD\8-K_2025-03-24.md'


2025-11-14 15:32:44,412 - INFO - Going to convert document batch...
2025-11-14 15:32:44,416 - INFO - Processing document 8-K_2025-03-31
2025-11-14 15:32:44,503 - INFO - Finished converting document 8-K_2025-03-31 in 0.14 sec.
2025-11-14 15:32:44,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,640 - INFO - Going to convert document batch...
2025-11-14 15:32:44,643 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:32:44,686 - INFO - Finished converting document 8-K_2025-04-16 in 0.12 sec.
2025-11-14 15:32:44,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-03-31' --> 'data\processed_data\AMD\8-K_2025-03-31.md'
Converted 'data\edgar_documents\AMD\8-K_2025-04-16' --> 'data\processed_data\AMD\8-K_2025-04-16.md'


2025-11-14 15:32:44,781 - INFO - Going to convert document batch...
2025-11-14 15:32:44,782 - INFO - Processing document 8-K_2025-05-06
2025-11-14 15:32:44,854 - INFO - Finished converting document 8-K_2025-05-06 in 0.14 sec.
2025-11-14 15:32:44,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,965 - INFO - Going to convert document batch...
2025-11-14 15:32:44,968 - INFO - Processing document 8-K_2025-05-16
2025-11-14 15:32:45,080 - INFO - Finished converting document 8-K_2025-05-16 in 0.19 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-05-06' --> 'data\processed_data\AMD\8-K_2025-05-06.md'


2025-11-14 15:32:45,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,185 - INFO - Going to convert document batch...
2025-11-14 15:32:45,187 - INFO - Processing document 8-K_2025-05-19
2025-11-14 15:32:45,227 - INFO - Finished converting document 8-K_2025-05-19 in 0.08 sec.
2025-11-14 15:32:45,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,330 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\8-K_2025-05-16' --> 'data\processed_data\AMD\8-K_2025-05-16.md'
Converted 'data\edgar_documents\AMD\8-K_2025-05-19' --> 'data\processed_data\AMD\8-K_2025-05-19.md'


2025-11-14 15:32:45,332 - INFO - Processing document 8-K_2025-06-03
2025-11-14 15:32:45,369 - INFO - Finished converting document 8-K_2025-06-03 in 0.09 sec.
2025-11-14 15:32:45,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,412 - INFO - Going to convert document batch...
2025-11-14 15:32:45,412 - INFO - Processing document 8-K_2025-07-02
2025-11-14 15:32:45,482 - INFO - Finished converting document 8-K_2025-07-02 in 0.11 sec.
2025-11-14 15:32:45,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-06-03' --> 'data\processed_data\AMD\8-K_2025-06-03.md'
Converted 'data\edgar_documents\AMD\8-K_2025-07-02' --> 'data\processed_data\AMD\8-K_2025-07-02.md'


2025-11-14 15:32:45,599 - INFO - Going to convert document batch...
2025-11-14 15:32:45,602 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:32:45,690 - INFO - Finished converting document 8-K_2025-08-05 in 0.16 sec.
2025-11-14 15:32:45,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,756 - INFO - Going to convert document batch...
2025-11-14 15:32:45,758 - INFO - Processing document 8-K_2025-08-25
2025-11-14 15:32:45,784 - INFO - Finished converting document 8-K_2025-08-25 in 0.08 sec.
2025-11-14 15:32:45,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,869 - INFO - Going to convert document batch...
2025-11-14 15:32:45,870 - INFO - Processing document 8-K_2025-10-06
2025-11-14 15:32:45,911 - INFO - Finished converting document 8-K_2025-10-06 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-08-05' --> 'data\processed_data\AMD\8-K_2025-08-05.md'
Converted 'data\edgar_documents\AMD\8-K_2025-08-25' --> 'data\processed_data\AMD\8-K_2025-08-25.md'


2025-11-14 15:32:45,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:46,009 - INFO - Going to convert document batch...
2025-11-14 15:32:46,011 - INFO - Processing document 8-K_2025-10-27
2025-11-14 15:32:46,086 - INFO - Finished converting document 8-K_2025-10-27 in 0.12 sec.
2025-11-14 15:32:46,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-10-06' --> 'data\processed_data\AMD\8-K_2025-10-06.md'
Converted 'data\edgar_documents\AMD\8-K_2025-10-27' --> 'data\processed_data\AMD\8-K_2025-10-27.md'


2025-11-14 15:32:46,160 - INFO - Going to convert document batch...
2025-11-14 15:32:46,162 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:32:46,227 - INFO - Finished converting document 8-K_2025-11-04 in 0.09 sec.
2025-11-14 15:32:46,374 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:32:46,375 - ERROR - Input document DEF-14A_2023-03-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:32:46,382 - INFO - Going to convert 

Converted 'data\edgar_documents\AMD\8-K_2025-11-04' --> 'data\processed_data\AMD\8-K_2025-11-04.md'
Error processing data\edgar_documents\AMD\DEF-14A_2023-03-31: File format not allowed: data\edgar_documents\AMD\DEF-14A_2023-03-31


2025-11-14 15:32:46,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:49,093 - INFO - Going to convert document batch...
2025-11-14 15:32:49,095 - INFO - Processing document DEF-14A_2024-03-25
2025-11-14 15:32:52,718 - INFO - Finished converting document DEF-14A_2024-03-25 in 6.34 sec.
2025-11-14 15:32:54,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\DEF-14A_2024-03-25' --> 'data\processed_data\AMD\DEF-14A_2024-03-25.md'


2025-11-14 15:32:56,681 - INFO - Going to convert document batch...
2025-11-14 15:32:56,683 - INFO - Processing document DEF-14A_2025-03-28
2025-11-14 15:33:00,552 - INFO - Finished converting document DEF-14A_2025-03-28 in 5.91 sec.


Converted 'data\edgar_documents\AMD\DEF-14A_2025-03-28' --> 'data\processed_data\AMD\DEF-14A_2025-03-28.md'
Processed 144 new files. Errors: 3
Found 92 files to process in data\edgar_documents\AMGN


2025-11-14 15:33:02,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:33:04,657 - INFO - Going to convert document batch...
2025-11-14 15:33:04,658 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:33:04,661 - INFO - Processing document 10-K_2023-02-09
2025-11-14 15:33:10,874 - INFO - Finished converting document 10-K_2023-02-09 in 8.72 sec.
2025-11-14 15:33:12,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-K_2023-02-09' --> 'data\processed_data\AMGN\10-K_2023-02-09.md'


2025-11-14 15:33:14,290 - INFO - Going to convert document batch...
2025-11-14 15:33:14,291 - INFO - Processing document 10-K_2024-02-14
2025-11-14 15:33:19,188 - INFO - Finished converting document 10-K_2024-02-14 in 6.91 sec.
2025-11-14 15:33:21,251 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:33:21,252 - ERROR - Input document 10-K_2025-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:33:21,256 - INFO - Going to convert d

Converted 'data\edgar_documents\AMGN\10-K_2024-02-14' --> 'data\processed_data\AMGN\10-K_2024-02-14.md'
Error processing data\edgar_documents\AMGN\10-K_2025-02-14: File format not allowed: data\edgar_documents\AMGN\10-K_2025-02-14


2025-11-14 15:33:22,319 - INFO - Going to convert document batch...
2025-11-14 15:33:22,321 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:33:24,730 - INFO - Finished converting document 10-Q_2023-04-28 in 3.48 sec.
2025-11-14 15:33:25,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-04-28' --> 'data\processed_data\AMGN\10-Q_2023-04-28.md'


2025-11-14 15:33:28,443 - INFO - Going to convert document batch...
2025-11-14 15:33:28,445 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:33:31,476 - INFO - Finished converting document 10-Q_2023-08-04 in 5.58 sec.
2025-11-14 15:33:32,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-08-04' --> 'data\processed_data\AMGN\10-Q_2023-08-04.md'


2025-11-14 15:33:33,516 - INFO - Going to convert document batch...
2025-11-14 15:33:33,517 - INFO - Processing document 10-Q_2023-10-31
2025-11-14 15:33:35,118 - INFO - Finished converting document 10-Q_2023-10-31 in 2.42 sec.
2025-11-14 15:33:36,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-10-31' --> 'data\processed_data\AMGN\10-Q_2023-10-31.md'


2025-11-14 15:33:37,536 - INFO - Going to convert document batch...
2025-11-14 15:33:37,537 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:33:40,362 - INFO - Finished converting document 10-Q_2024-05-03 in 4.01 sec.
2025-11-14 15:33:41,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-05-03' --> 'data\processed_data\AMGN\10-Q_2024-05-03.md'


2025-11-14 15:33:43,684 - INFO - Going to convert document batch...
2025-11-14 15:33:43,686 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:33:47,023 - INFO - Finished converting document 10-Q_2024-08-07 in 5.38 sec.
2025-11-14 15:33:48,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-08-07' --> 'data\processed_data\AMGN\10-Q_2024-08-07.md'


2025-11-14 15:33:50,929 - INFO - Going to convert document batch...
2025-11-14 15:33:50,931 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:33:53,728 - INFO - Finished converting document 10-Q_2024-10-31 in 5.31 sec.
2025-11-14 15:33:55,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-10-31' --> 'data\processed_data\AMGN\10-Q_2024-10-31.md'


2025-11-14 15:33:57,224 - INFO - Going to convert document batch...
2025-11-14 15:33:57,226 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:33:59,879 - INFO - Finished converting document 10-Q_2025-05-02 in 4.70 sec.
2025-11-14 15:34:01,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2025-05-02' --> 'data\processed_data\AMGN\10-Q_2025-05-02.md'


2025-11-14 15:34:03,034 - INFO - Going to convert document batch...
2025-11-14 15:34:03,035 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:34:06,037 - INFO - Finished converting document 10-Q_2025-08-06 in 4.77 sec.
2025-11-14 15:34:08,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2025-08-06' --> 'data\processed_data\AMGN\10-Q_2025-08-06.md'


2025-11-14 15:34:10,487 - INFO - Going to convert document batch...
2025-11-14 15:34:10,489 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:34:13,921 - INFO - Finished converting document 10-Q_2025-11-05 in 5.16 sec.
2025-11-14 15:34:15,572 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:15,573 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:15,574 - INFO - Going to convert document batch...
2025-11-14 15:34:15,59

Converted 'data\edgar_documents\AMGN\10-Q_2025-11-05' --> 'data\processed_data\AMGN\10-Q_2025-11-05.md'
Error processing data\edgar_documents\AMGN\4_2023-02-14: File format not allowed: data\edgar_documents\AMGN\4_2023-02-14
Error processing data\edgar_documents\AMGN\4_2023-02-17: File format not allowed: data\edgar_documents\AMGN\4_2023-02-17
Converted 'data\edgar_documents\AMGN\4_2023-03-08' --> 'data\processed_data\AMGN\4_2023-03-08.md'


2025-11-14 15:34:15,770 - INFO - Going to convert document batch...
2025-11-14 15:34:15,772 - INFO - Processing document 4_2023-03-20
2025-11-14 15:34:15,867 - INFO - Finished converting document 4_2023-03-20 in 0.12 sec.
2025-11-14 15:34:15,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:15,985 - INFO - Going to convert document batch...
2025-11-14 15:34:15,987 - INFO - Processing document 4_2023-05-02
2025-11-14 15:34:16,048 - INFO - Finished converting document 4_2023-05-02 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2023-03-20' --> 'data\processed_data\AMGN\4_2023-03-20.md'
Converted 'data\edgar_documents\AMGN\4_2023-05-02' --> 'data\processed_data\AMGN\4_2023-05-02.md'


2025-11-14 15:34:16,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:16,174 - INFO - Going to convert document batch...
2025-11-14 15:34:16,176 - INFO - Processing document 4_2023-05-03
2025-11-14 15:34:16,214 - INFO - Finished converting document 4_2023-05-03 in 0.11 sec.
2025-11-14 15:34:16,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:16,306 - INFO - Going to convert document batch...
2025-11-14 15:34:16,313 - INFO - Processing document 4_2023-05-04
2025-11-14 15:34:16,397 - INFO - Finished converting document 4_2023-05-04 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2023-05-03' --> 'data\processed_data\AMGN\4_2023-05-03.md'


2025-11-14 15:34:16,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-05-04' --> 'data\processed_data\AMGN\4_2023-05-04.md'


2025-11-14 15:34:17,285 - INFO - Going to convert document batch...
2025-11-14 15:34:17,287 - INFO - Processing document 4_2023-05-09
2025-11-14 15:34:17,332 - INFO - Finished converting document 4_2023-05-09 in 0.89 sec.
2025-11-14 15:34:17,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,410 - INFO - Going to convert document batch...
2025-11-14 15:34:17,410 - INFO - Processing document 4_2023-05-23
2025-11-14 15:34:17,441 - INFO - Finished converting document 4_2023-05-23 in 0.06 sec.
2025-11-14 15:34:17,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,545 - INFO - Going to convert document batch...
2025-11-14 15:34:17,547 - INFO - Processing document 4_2023-07-31


Converted 'data\edgar_documents\AMGN\4_2023-05-09' --> 'data\processed_data\AMGN\4_2023-05-09.md'
Converted 'data\edgar_documents\AMGN\4_2023-05-23' --> 'data\processed_data\AMGN\4_2023-05-23.md'


2025-11-14 15:34:17,604 - INFO - Finished converting document 4_2023-07-31 in 0.12 sec.
2025-11-14 15:34:17,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,713 - INFO - Going to convert document batch...
2025-11-14 15:34:17,714 - INFO - Processing document 4_2023-08-10
2025-11-14 15:34:17,749 - INFO - Finished converting document 4_2023-08-10 in 0.08 sec.
2025-11-14 15:34:17,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,823 - INFO - Going to convert document batch...
2025-11-14 15:34:17,824 - INFO - Processing document 4_2023-08-11


Converted 'data\edgar_documents\AMGN\4_2023-07-31' --> 'data\processed_data\AMGN\4_2023-07-31.md'
Converted 'data\edgar_documents\AMGN\4_2023-08-10' --> 'data\processed_data\AMGN\4_2023-08-10.md'


2025-11-14 15:34:17,862 - INFO - Finished converting document 4_2023-08-11 in 0.08 sec.
2025-11-14 15:34:17,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,931 - INFO - Going to convert document batch...
2025-11-14 15:34:17,931 - INFO - Processing document 4_2023-09-19
2025-11-14 15:34:18,003 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 15:34:18,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-08-11' --> 'data\processed_data\AMGN\4_2023-08-11.md'
Converted 'data\edgar_documents\AMGN\4_2023-09-19' --> 'data\processed_data\AMGN\4_2023-09-19.md'


2025-11-14 15:34:18,085 - INFO - Going to convert document batch...
2025-11-14 15:34:18,087 - INFO - Processing document 4_2023-11-03
2025-11-14 15:34:18,168 - INFO - Finished converting document 4_2023-11-03 in 0.12 sec.
2025-11-14 15:34:18,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,227 - INFO - Going to convert document batch...
2025-11-14 15:34:18,228 - INFO - Processing document 4_2023-11-07
2025-11-14 15:34:18,281 - INFO - Finished converting document 4_2023-11-07 in 0.08 sec.
2025-11-14 15:34:18,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-11-03' --> 'data\processed_data\AMGN\4_2023-11-03.md'
Converted 'data\edgar_documents\AMGN\4_2023-11-07' --> 'data\processed_data\AMGN\4_2023-11-07.md'


2025-11-14 15:34:18,395 - INFO - Going to convert document batch...
2025-11-14 15:34:18,396 - INFO - Processing document 4_2023-11-13
2025-11-14 15:34:18,432 - INFO - Finished converting document 4_2023-11-13 in 0.09 sec.
2025-11-14 15:34:18,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,514 - INFO - Going to convert document batch...
2025-11-14 15:34:18,516 - INFO - Processing document 4_2023-11-29
2025-11-14 15:34:18,581 - INFO - Finished converting document 4_2023-11-29 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2023-11-13' --> 'data\processed_data\AMGN\4_2023-11-13.md'


2025-11-14 15:34:18,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,709 - INFO - Going to convert document batch...
2025-11-14 15:34:18,710 - INFO - Processing document 4_2023-12-04
2025-11-14 15:34:18,746 - INFO - Finished converting document 4_2023-12-04 in 0.08 sec.
2025-11-14 15:34:18,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,811 - INFO - Going to convert document batch...
2025-11-14 15:34:18,815 - INFO - Processing document 4_2024-02-12


Converted 'data\edgar_documents\AMGN\4_2023-11-29' --> 'data\processed_data\AMGN\4_2023-11-29.md'
Converted 'data\edgar_documents\AMGN\4_2023-12-04' --> 'data\processed_data\AMGN\4_2023-12-04.md'


2025-11-14 15:34:18,856 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.
2025-11-14 15:34:18,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,975 - INFO - Going to convert document batch...
2025-11-14 15:34:18,977 - INFO - Processing document 4_2024-03-08
2025-11-14 15:34:19,030 - INFO - Finished converting document 4_2024-03-08 in 0.11 sec.
2025-11-14 15:34:19,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-02-12' --> 'data\processed_data\AMGN\4_2024-02-12.md'
Converted 'data\edgar_documents\AMGN\4_2024-03-08' --> 'data\processed_data\AMGN\4_2024-03-08.md'


2025-11-14 15:34:19,123 - INFO - Going to convert document batch...
2025-11-14 15:34:19,125 - INFO - Processing document 4_2024-03-20
2025-11-14 15:34:19,161 - INFO - Finished converting document 4_2024-03-20 in 0.08 sec.
2025-11-14 15:34:19,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,241 - INFO - Going to convert document batch...
2025-11-14 15:34:19,242 - INFO - Processing document 4_2024-05-01
2025-11-14 15:34:19,280 - INFO - Finished converting document 4_2024-05-01 in 0.08 sec.
2025-11-14 15:34:19,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-03-20' --> 'data\processed_data\AMGN\4_2024-03-20.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-01' --> 'data\processed_data\AMGN\4_2024-05-01.md'


2025-11-14 15:34:19,392 - INFO - Going to convert document batch...
2025-11-14 15:34:19,395 - INFO - Processing document 4_2024-05-02
2025-11-14 15:34:19,461 - INFO - Finished converting document 4_2024-05-02 in 0.12 sec.
2025-11-14 15:34:19,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,589 - INFO - Going to convert document batch...
2025-11-14 15:34:19,590 - INFO - Processing document 4_2024-05-03
2025-11-14 15:34:19,626 - INFO - Finished converting document 4_2024-05-03 in 0.09 sec.
2025-11-14 15:34:19,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,705 - INFO - Going to convert document batch...
2025-11-14 15:34:19,706 - INFO - Processing document 4_2024-05-06
2025-11-14 15:34:19,736 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.


Converted 'data\edgar_documents\AMGN\4_2024-05-02' --> 'data\processed_data\AMGN\4_2024-05-02.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-03' --> 'data\processed_data\AMGN\4_2024-05-03.md'


2025-11-14 15:34:19,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,789 - INFO - Going to convert document batch...
2025-11-14 15:34:19,790 - INFO - Processing document 4_2024-05-07
2025-11-14 15:34:19,819 - INFO - Finished converting document 4_2024-05-07 in 0.05 sec.
2025-11-14 15:34:19,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,924 - INFO - Going to convert document batch...
2025-11-14 15:34:19,926 - INFO - Processing document 4_2024-05-08


Converted 'data\edgar_documents\AMGN\4_2024-05-06' --> 'data\processed_data\AMGN\4_2024-05-06.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-07' --> 'data\processed_data\AMGN\4_2024-05-07.md'


2025-11-14 15:34:20,006 - INFO - Finished converting document 4_2024-05-08 in 0.14 sec.
2025-11-14 15:34:20,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,112 - INFO - Going to convert document batch...
2025-11-14 15:34:20,115 - INFO - Processing document 4_2024-05-09
2025-11-14 15:34:20,165 - INFO - Finished converting document 4_2024-05-09 in 0.09 sec.
2025-11-14 15:34:20,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-05-08' --> 'data\processed_data\AMGN\4_2024-05-08.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-09' --> 'data\processed_data\AMGN\4_2024-05-09.md'


2025-11-14 15:34:20,250 - INFO - Going to convert document batch...
2025-11-14 15:34:20,251 - INFO - Processing document 4_2024-06-04
2025-11-14 15:34:20,287 - INFO - Finished converting document 4_2024-06-04 in 0.08 sec.
2025-11-14 15:34:20,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,371 - INFO - Going to convert document batch...
2025-11-14 15:34:20,373 - INFO - Processing document 4_2024-07-31
2025-11-14 15:34:20,453 - INFO - Finished converting document 4_2024-07-31 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2024-06-04' --> 'data\processed_data\AMGN\4_2024-06-04.md'
Converted 'data\edgar_documents\AMGN\4_2024-07-31' --> 'data\processed_data\AMGN\4_2024-07-31.md'


2025-11-14 15:34:20,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,537 - INFO - Going to convert document batch...
2025-11-14 15:34:20,540 - INFO - Processing document 4_2024-08-13
2025-11-14 15:34:20,604 - INFO - Finished converting document 4_2024-08-13 in 0.12 sec.
2025-11-14 15:34:20,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,708 - INFO - Going to convert document batch...
2025-11-14 15:34:20,711 - INFO - Processing document 4_2024-11-06
2025-11-14 15:34:20,756 - INFO - Finished converting document 4_2024-11-06 in 0.09 sec.
2025-11-14 15:34:20,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-08-13' --> 'data\processed_data\AMGN\4_2024-08-13.md'
Converted 'data\edgar_documents\AMGN\4_2024-11-06' --> 'data\processed_data\AMGN\4_2024-11-06.md'


2025-11-14 15:34:20,882 - INFO - Going to convert document batch...
2025-11-14 15:34:20,884 - INFO - Processing document 4_2024-12-03
2025-11-14 15:34:20,935 - INFO - Finished converting document 4_2024-12-03 in 0.14 sec.
2025-11-14 15:34:20,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,991 - INFO - Going to convert document batch...
2025-11-14 15:34:20,993 - INFO - Processing document 4_2024-12-06
2025-11-14 15:34:21,023 - INFO - Finished converting document 4_2024-12-06 in 0.05 sec.
2025-11-14 15:34:21,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,139 - INFO - Going to convert document batch...
2025-11-14 15:34:21,140 - INFO - Processing document 4_2025-02-06


Converted 'data\edgar_documents\AMGN\4_2024-12-03' --> 'data\processed_data\AMGN\4_2024-12-03.md'
Converted 'data\edgar_documents\AMGN\4_2024-12-06' --> 'data\processed_data\AMGN\4_2024-12-06.md'


2025-11-14 15:34:21,195 - INFO - Finished converting document 4_2025-02-06 in 0.09 sec.
2025-11-14 15:34:21,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,290 - INFO - Going to convert document batch...
2025-11-14 15:34:21,291 - INFO - Processing document 4_2025-02-10
2025-11-14 15:34:21,332 - INFO - Finished converting document 4_2025-02-10 in 0.08 sec.
2025-11-14 15:34:21,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,442 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\4_2025-02-06' --> 'data\processed_data\AMGN\4_2025-02-06.md'
Converted 'data\edgar_documents\AMGN\4_2025-02-10' --> 'data\processed_data\AMGN\4_2025-02-10.md'


2025-11-14 15:34:21,444 - INFO - Processing document 4_2025-02-13
2025-11-14 15:34:21,516 - INFO - Finished converting document 4_2025-02-13 in 0.12 sec.
2025-11-14 15:34:21,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,632 - INFO - Going to convert document batch...
2025-11-14 15:34:21,634 - INFO - Processing document 4_2025-02-20
2025-11-14 15:34:21,701 - INFO - Finished converting document 4_2025-02-20 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2025-02-13' --> 'data\processed_data\AMGN\4_2025-02-13.md'
Converted 'data\edgar_documents\AMGN\4_2025-02-20' --> 'data\processed_data\AMGN\4_2025-02-20.md'


2025-11-14 15:34:21,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,831 - INFO - Going to convert document batch...
2025-11-14 15:34:21,834 - INFO - Processing document 4_2025-02-21
2025-11-14 15:34:21,906 - INFO - Finished converting document 4_2025-02-21 in 0.16 sec.
2025-11-14 15:34:21,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,005 - INFO - Going to convert document batch...
2025-11-14 15:34:22,005 - INFO - Processing document 4_2025-03-05
2025-11-14 15:34:22,065 - INFO - Finished converting document 4_2025-03-05 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2025-02-21' --> 'data\processed_data\AMGN\4_2025-02-21.md'
Converted 'data\edgar_documents\AMGN\4_2025-03-05' --> 'data\processed_data\AMGN\4_2025-03-05.md'


2025-11-14 15:34:22,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,186 - INFO - Going to convert document batch...
2025-11-14 15:34:22,188 - INFO - Processing document 4_2025-03-19
2025-11-14 15:34:22,257 - INFO - Finished converting document 4_2025-03-19 in 0.12 sec.
2025-11-14 15:34:22,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,347 - INFO - Going to convert document batch...
2025-11-14 15:34:22,349 - INFO - Processing document 4_2025-05-02
2025-11-14 15:34:22,395 - INFO - Finished converting document 4_2025-05-02 in 0.08 sec.
2025-11-14 15:34:22,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,507 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\4_2025-03-19' --> 'data\processed_data\AMGN\4_2025-03-19.md'
Converted 'data\edgar_documents\AMGN\4_2025-05-02' --> 'data\processed_data\AMGN\4_2025-05-02.md'


2025-11-14 15:34:22,508 - INFO - Processing document 4_2025-05-06
2025-11-14 15:34:22,572 - INFO - Finished converting document 4_2025-05-06 in 0.11 sec.
2025-11-14 15:34:22,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,652 - INFO - Going to convert document batch...
2025-11-14 15:34:22,654 - INFO - Processing document 4_2025-05-08
2025-11-14 15:34:22,700 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.
2025-11-14 15:34:22,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,772 - INFO - Going to convert document batch...
2025-11-14 15:34:22,774 - INFO - Processing document 4_2025-05-28


Converted 'data\edgar_documents\AMGN\4_2025-05-06' --> 'data\processed_data\AMGN\4_2025-05-06.md'
Converted 'data\edgar_documents\AMGN\4_2025-05-08' --> 'data\processed_data\AMGN\4_2025-05-08.md'


2025-11-14 15:34:22,824 - INFO - Finished converting document 4_2025-05-28 in 0.09 sec.
2025-11-14 15:34:22,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,897 - INFO - Going to convert document batch...
2025-11-14 15:34:22,899 - INFO - Processing document 4_2025-06-06
2025-11-14 15:34:22,964 - INFO - Finished converting document 4_2025-06-06 in 0.11 sec.
2025-11-14 15:34:23,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2025-05-28' --> 'data\processed_data\AMGN\4_2025-05-28.md'
Converted 'data\edgar_documents\AMGN\4_2025-06-06' --> 'data\processed_data\AMGN\4_2025-06-06.md'


2025-11-14 15:34:23,065 - INFO - Going to convert document batch...
2025-11-14 15:34:23,067 - INFO - Processing document 4_2025-08-12
2025-11-14 15:34:23,124 - INFO - Finished converting document 4_2025-08-12 in 0.11 sec.
2025-11-14 15:34:23,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,223 - INFO - Going to convert document batch...
2025-11-14 15:34:23,224 - INFO - Processing document 4_2025-08-22
2025-11-14 15:34:23,261 - INFO - Finished converting document 4_2025-08-22 in 0.08 sec.
2025-11-14 15:34:23,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,353 - INFO - Going to convert document batch...
2025-11-14 15:34:23,355 - INFO - Processing document 4_2025-11-07


Converted 'data\edgar_documents\AMGN\4_2025-08-12' --> 'data\processed_data\AMGN\4_2025-08-12.md'
Converted 'data\edgar_documents\AMGN\4_2025-08-22' --> 'data\processed_data\AMGN\4_2025-08-22.md'


2025-11-14 15:34:23,409 - INFO - Finished converting document 4_2025-11-07 in 0.11 sec.
2025-11-14 15:34:23,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,523 - INFO - Going to convert document batch...
2025-11-14 15:34:23,524 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:34:23,582 - INFO - Finished converting document 8-K_2023-01-31 in 0.11 sec.
2025-11-14 15:34:23,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2025-11-07' --> 'data\processed_data\AMGN\4_2025-11-07.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-01-31' --> 'data\processed_data\AMGN\8-K_2023-01-31.md'


2025-11-14 15:34:23,688 - INFO - Going to convert document batch...
2025-11-14 15:34:23,690 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:34:23,735 - INFO - Finished converting document 8-K_2023-02-16 in 0.14 sec.
2025-11-14 15:34:23,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,805 - INFO - Going to convert document batch...
2025-11-14 15:34:23,807 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:34:23,864 - INFO - Finished converting document 8-K_2023-03-02 in 0.09 sec.
2025-11-14 15:34:23,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,950 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-02-16' --> 'data\processed_data\AMGN\8-K_2023-02-16.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-03-02' --> 'data\processed_data\AMGN\8-K_2023-03-02.md'


2025-11-14 15:34:23,950 - INFO - Processing document 8-K_2023-03-09
2025-11-14 15:34:24,002 - INFO - Finished converting document 8-K_2023-03-09 in 0.11 sec.
2025-11-14 15:34:24,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,074 - INFO - Going to convert document batch...
2025-11-14 15:34:24,075 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:34:24,119 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 15:34:24,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,209 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-03-09' --> 'data\processed_data\AMGN\8-K_2023-03-09.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-04-27' --> 'data\processed_data\AMGN\8-K_2023-04-27.md'


2025-11-14 15:34:24,212 - INFO - Processing document 8-K_2023-05-16
2025-11-14 15:34:24,264 - INFO - Finished converting document 8-K_2023-05-16 in 0.12 sec.
2025-11-14 15:34:24,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,362 - INFO - Going to convert document batch...
2025-11-14 15:34:24,364 - INFO - Processing document 8-K_2023-05-18
2025-11-14 15:34:24,412 - INFO - Finished converting document 8-K_2023-05-18 in 0.11 sec.
2025-11-14 15:34:24,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2023-05-16' --> 'data\processed_data\AMGN\8-K_2023-05-16.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-05-18' --> 'data\processed_data\AMGN\8-K_2023-05-18.md'


2025-11-14 15:34:24,526 - INFO - Going to convert document batch...
2025-11-14 15:34:24,528 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:34:24,631 - INFO - Finished converting document 8-K_2023-05-22 in 0.19 sec.
2025-11-14 15:34:24,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,716 - INFO - Going to convert document batch...
2025-11-14 15:34:24,720 - INFO - Processing document 8-K_2023-06-05
2025-11-14 15:34:24,769 - INFO - Finished converting document 8-K_2023-06-05 in 0.09 sec.
2025-11-14 15:34:24,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,871 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-05-22' --> 'data\processed_data\AMGN\8-K_2023-05-22.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-06-05' --> 'data\processed_data\AMGN\8-K_2023-06-05.md'


2025-11-14 15:34:24,873 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:34:24,952 - INFO - Finished converting document 8-K_2023-08-03 in 0.16 sec.
2025-11-14 15:34:25,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,039 - INFO - Going to convert document batch...
2025-11-14 15:34:25,041 - INFO - Processing document 8-K_2023-08-04
2025-11-14 15:34:25,093 - INFO - Finished converting document 8-K_2023-08-04 in 0.11 sec.
2025-11-14 15:34:25,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2023-08-03' --> 'data\processed_data\AMGN\8-K_2023-08-03.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-08-04' --> 'data\processed_data\AMGN\8-K_2023-08-04.md'


2025-11-14 15:34:25,189 - INFO - Going to convert document batch...
2025-11-14 15:34:25,193 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:34:25,227 - INFO - Finished converting document 8-K_2023-09-01 in 0.09 sec.
2025-11-14 15:34:25,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,280 - INFO - Going to convert document batch...
2025-11-14 15:34:25,281 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:34:25,317 - INFO - Finished converting document 8-K_2023-09-05 in 0.08 sec.
2025-11-14 15:34:25,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,380 - INFO - Going to convert document batch...
2025-11-14 15:34:25,381 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:34:25,413 - INFO - Finished converting document 8-K_2023-09-12 in 0.08 sec.


Converted 'data\edgar_documents\AMGN\8-K_2023-09-01' --> 'data\processed_data\AMGN\8-K_2023-09-01.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-09-05' --> 'data\processed_data\AMGN\8-K_2023-09-05.md'


2025-11-14 15:34:25,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,467 - INFO - Going to convert document batch...
2025-11-14 15:34:25,470 - INFO - Processing document 8-K_2023-10-05
2025-11-14 15:34:25,510 - INFO - Finished converting document 8-K_2023-10-05 in 0.08 sec.
2025-11-14 15:34:25,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,580 - INFO - Going to convert document batch...
2025-11-14 15:34:25,581 - INFO - Processing document 8-K_2023-10-06
2025-11-14 15:34:25,625 - INFO - Finished converting document 8-K_2023-10-06 in 0.09 sec.


Converted 'data\edgar_documents\AMGN\8-K_2023-09-12' --> 'data\processed_data\AMGN\8-K_2023-09-12.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-10-05' --> 'data\processed_data\AMGN\8-K_2023-10-05.md'


2025-11-14 15:34:25,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,698 - INFO - Going to convert document batch...
2025-11-14 15:34:25,699 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:34:25,736 - INFO - Finished converting document 8-K_2023-10-31 in 0.08 sec.
2025-11-14 15:34:25,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,824 - INFO - Going to convert document batch...
2025-11-14 15:34:25,824 - INFO - Processing document 8-K_2023-12-14


Converted 'data\edgar_documents\AMGN\8-K_2023-10-06' --> 'data\processed_data\AMGN\8-K_2023-10-06.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-10-31' --> 'data\processed_data\AMGN\8-K_2023-10-31.md'


2025-11-14 15:34:25,882 - INFO - Finished converting document 8-K_2023-12-14 in 0.12 sec.
2025-11-14 15:34:25,948 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:25,951 - ERROR - Input document 8-K_2024-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:25,953 - INFO - Going to convert document batch...
2025-11-14 15:34:25,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:26,015 - INFO - Going to convert document batch...
2025-11-14

Converted 'data\edgar_documents\AMGN\8-K_2023-12-14' --> 'data\processed_data\AMGN\8-K_2023-12-14.md'
Error processing data\edgar_documents\AMGN\8-K_2024-02-06: File format not allowed: data\edgar_documents\AMGN\8-K_2024-02-06


2025-11-14 15:34:26,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2024-05-02' --> 'data\processed_data\AMGN\8-K_2024-05-02.md'


2025-11-14 15:34:26,793 - INFO - Going to convert document batch...
2025-11-14 15:34:26,796 - INFO - Processing document 8-K_2024-06-03
2025-11-14 15:34:26,887 - INFO - Finished converting document 8-K_2024-06-03 in 0.78 sec.
2025-11-14 15:34:26,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:26,995 - INFO - Going to convert document batch...
2025-11-14 15:34:26,997 - INFO - Processing document 8-K_2024-08-06
2025-11-14 15:34:27,062 - INFO - Finished converting document 8-K_2024-08-06 in 0.12 sec.


Converted 'data\edgar_documents\AMGN\8-K_2024-06-03' --> 'data\processed_data\AMGN\8-K_2024-06-03.md'
Converted 'data\edgar_documents\AMGN\8-K_2024-08-06' --> 'data\processed_data\AMGN\8-K_2024-08-06.md'


2025-11-14 15:34:27,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,159 - INFO - Going to convert document batch...
2025-11-14 15:34:27,161 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:34:27,233 - INFO - Finished converting document 8-K_2024-10-30 in 0.14 sec.
2025-11-14 15:34:27,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,300 - INFO - Going to convert document batch...
2025-11-14 15:34:27,301 - INFO - Processing document 8-K_2025-02-04
2025-11-14 15:34:27,363 - INFO - Finished converting document 8-K_2025-02-04 in 0.09 sec.
2025-11-14 15:34:27,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,473 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2024-10-30' --> 'data\processed_data\AMGN\8-K_2024-10-30.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-02-04' --> 'data\processed_data\AMGN\8-K_2025-02-04.md'


2025-11-14 15:34:27,475 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:34:27,551 - INFO - Finished converting document 8-K_2025-05-01 in 0.14 sec.
2025-11-14 15:34:27,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,659 - INFO - Going to convert document batch...
2025-11-14 15:34:27,661 - INFO - Processing document 8-K_2025-05-27
2025-11-14 15:34:27,726 - INFO - Finished converting document 8-K_2025-05-27 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\8-K_2025-05-01' --> 'data\processed_data\AMGN\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-05-27' --> 'data\processed_data\AMGN\8-K_2025-05-27.md'


2025-11-14 15:34:27,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,820 - INFO - Going to convert document batch...
2025-11-14 15:34:27,822 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:34:27,893 - INFO - Finished converting document 8-K_2025-08-05 in 0.14 sec.
2025-11-14 15:34:27,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:28,012 - INFO - Going to convert document batch...
2025-11-14 15:34:28,014 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:34:28,074 - INFO - Finished converting document 8-K_2025-11-04 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\8-K_2025-08-05' --> 'data\processed_data\AMGN\8-K_2025-08-05.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-11-04' --> 'data\processed_data\AMGN\8-K_2025-11-04.md'


2025-11-14 15:34:28,222 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:28,224 - ERROR - Input document DEF-14A_2023-04-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:28,229 - INFO - Going to convert document batch...
2025-11-14 15:34:28,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\AMGN\DEF-14A_2023-04-06: File format not allowed: data\edgar_documents\AMGN\DEF-14A_2023-04-06


2025-11-14 15:34:32,285 - INFO - Going to convert document batch...
2025-11-14 15:34:32,286 - INFO - Processing document DEF-14A_2024-04-17
2025-11-14 15:34:53,622 - INFO - Finished converting document DEF-14A_2024-04-17 in 25.39 sec.
2025-11-14 15:34:57,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\DEF-14A_2024-04-17' --> 'data\processed_data\AMGN\DEF-14A_2024-04-17.md'


2025-11-14 15:35:00,992 - INFO - Going to convert document batch...
2025-11-14 15:35:00,993 - INFO - Processing document DEF-14A_2025-04-09
2025-11-14 15:35:08,486 - INFO - Finished converting document DEF-14A_2025-04-09 in 11.62 sec.
2025-11-14 15:35:10,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\DEF-14A_2025-04-09' --> 'data\processed_data\AMGN\DEF-14A_2025-04-09.md'
Processed 87 new files. Errors: 5
Found 146 files to process in data\edgar_documents\AMT


2025-11-14 15:35:13,585 - INFO - Going to convert document batch...
2025-11-14 15:35:13,587 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:35:13,589 - INFO - Processing document 10-K_2023-02-23
2025-11-14 15:35:19,428 - INFO - Finished converting document 10-K_2023-02-23 in 9.47 sec.
2025-11-14 15:35:22,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2023-02-23' --> 'data\processed_data\AMT\10-K_2023-02-23.md'


2025-11-14 15:35:24,761 - INFO - Going to convert document batch...
2025-11-14 15:35:24,762 - INFO - Processing document 10-K_2024-02-27
2025-11-14 15:35:30,733 - INFO - Finished converting document 10-K_2024-02-27 in 8.45 sec.
2025-11-14 15:35:33,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2024-02-27' --> 'data\processed_data\AMT\10-K_2024-02-27.md'


2025-11-14 15:35:37,183 - INFO - Going to convert document batch...
2025-11-14 15:35:37,185 - INFO - Processing document 10-K_2025-02-25
2025-11-14 15:35:44,650 - INFO - Finished converting document 10-K_2025-02-25 in 11.69 sec.
2025-11-14 15:35:47,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2025-02-25' --> 'data\processed_data\AMT\10-K_2025-02-25.md'


2025-11-14 15:35:48,702 - INFO - Going to convert document batch...
2025-11-14 15:35:48,703 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 15:35:50,954 - INFO - Finished converting document 10-Q_2023-04-26 in 3.81 sec.
2025-11-14 15:35:53,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-04-26' --> 'data\processed_data\AMT\10-Q_2023-04-26.md'


2025-11-14 15:35:55,303 - INFO - Going to convert document batch...
2025-11-14 15:35:55,305 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:35:59,173 - INFO - Finished converting document 10-Q_2023-07-27 in 5.81 sec.
2025-11-14 15:36:00,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-07-27' --> 'data\processed_data\AMT\10-Q_2023-07-27.md'


2025-11-14 15:36:02,747 - INFO - Going to convert document batch...
2025-11-14 15:36:02,748 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:36:06,894 - INFO - Finished converting document 10-Q_2023-10-26 in 6.25 sec.
2025-11-14 15:36:08,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-10-26' --> 'data\processed_data\AMT\10-Q_2023-10-26.md'


2025-11-14 15:36:09,483 - INFO - Going to convert document batch...
2025-11-14 15:36:09,485 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 15:36:11,888 - INFO - Finished converting document 10-Q_2024-04-30 in 3.78 sec.
2025-11-14 15:36:13,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-04-30' --> 'data\processed_data\AMT\10-Q_2024-04-30.md'


2025-11-14 15:36:15,892 - INFO - Going to convert document batch...
2025-11-14 15:36:15,894 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 15:36:18,786 - INFO - Finished converting document 10-Q_2024-07-30 in 5.62 sec.
2025-11-14 15:36:20,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-07-30' --> 'data\processed_data\AMT\10-Q_2024-07-30.md'


2025-11-14 15:36:22,810 - INFO - Going to convert document batch...
2025-11-14 15:36:22,811 - INFO - Processing document 10-Q_2024-10-29
2025-11-14 15:36:26,070 - INFO - Finished converting document 10-Q_2024-10-29 in 5.98 sec.
2025-11-14 15:36:27,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-10-29' --> 'data\processed_data\AMT\10-Q_2024-10-29.md'


2025-11-14 15:36:29,378 - INFO - Going to convert document batch...
2025-11-14 15:36:29,379 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 15:36:31,678 - INFO - Finished converting document 10-Q_2025-04-29 in 4.20 sec.
2025-11-14 15:36:32,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2025-04-29' --> 'data\processed_data\AMT\10-Q_2025-04-29.md'


2025-11-14 15:36:33,185 - INFO - Going to convert document batch...
2025-11-14 15:36:33,186 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:36:34,404 - INFO - Finished converting document 10-Q_2025-07-29 in 2.22 sec.
2025-11-14 15:36:34,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2025-07-29' --> 'data\processed_data\AMT\10-Q_2025-07-29.md'


2025-11-14 15:36:35,570 - INFO - Going to convert document batch...
2025-11-14 15:36:35,571 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 15:36:37,060 - INFO - Finished converting document 10-Q_2025-10-28 in 2.11 sec.
2025-11-14 15:36:37,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,614 - INFO - Going to convert document batch...
2025-11-14 15:36:37,615 - INFO - Processing document 4_2023-01-04
2025-11-14 15:36:37,632 - INFO - Finished converting document 4_2023-01-04 in 0.03 sec.
2025-11-14 15:36:37,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,679 - INFO - Going to convert document batch...
2025-11-14 15:36:37,680 - INFO - Processing document 4_2023-01-05
2025-11-14 15:36:37,699 - INFO - Finished converting document 4_2023-01-05 in 0.05 sec.
2025-11-14 15:36:37,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,736 - INFO - Going to convert document batch...
2025-11-14 15:36:37,

Converted 'data\edgar_documents\AMT\10-Q_2025-10-28' --> 'data\processed_data\AMT\10-Q_2025-10-28.md'
Converted 'data\edgar_documents\AMT\4_2023-01-04' --> 'data\processed_data\AMT\4_2023-01-04.md'
Converted 'data\edgar_documents\AMT\4_2023-01-05' --> 'data\processed_data\AMT\4_2023-01-05.md'
Converted 'data\edgar_documents\AMT\4_2023-01-11' --> 'data\processed_data\AMT\4_2023-01-11.md'


2025-11-14 15:36:37,792 - INFO - Going to convert document batch...
2025-11-14 15:36:37,793 - INFO - Processing document 4_2023-01-18
2025-11-14 15:36:37,815 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:36:37,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,853 - INFO - Going to convert document batch...
2025-11-14 15:36:37,853 - INFO - Processing document 4_2023-01-19
2025-11-14 15:36:37,868 - INFO - Finished converting document 4_2023-01-19 in 0.03 sec.
2025-11-14 15:36:37,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,904 - INFO - Going to convert document batch...
2025-11-14 15:36:37,905 - INFO - Processing document 4_2023-02-06
2025-11-14 15:36:37,924 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 15:36:37,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,975 - INFO - Going to convert document batch...
2025-11-14 15:36:37,975 - 

Converted 'data\edgar_documents\AMT\4_2023-01-18' --> 'data\processed_data\AMT\4_2023-01-18.md'
Converted 'data\edgar_documents\AMT\4_2023-01-19' --> 'data\processed_data\AMT\4_2023-01-19.md'
Converted 'data\edgar_documents\AMT\4_2023-02-06' --> 'data\processed_data\AMT\4_2023-02-06.md'
Converted 'data\edgar_documents\AMT\4_2023-02-08' --> 'data\processed_data\AMT\4_2023-02-08.md'


2025-11-14 15:36:38,035 - INFO - Going to convert document batch...
2025-11-14 15:36:38,036 - INFO - Processing document 4_2023-02-28
2025-11-14 15:36:38,052 - INFO - Finished converting document 4_2023-02-28 in 0.03 sec.
2025-11-14 15:36:38,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,091 - INFO - Going to convert document batch...
2025-11-14 15:36:38,091 - INFO - Processing document 4_2023-03-01
2025-11-14 15:36:38,115 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 15:36:38,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,154 - INFO - Going to convert document batch...
2025-11-14 15:36:38,156 - INFO - Processing document 4_2023-03-14
2025-11-14 15:36:38,172 - INFO - Finished converting document 4_2023-03-14 in 0.03 sec.
2025-11-14 15:36:38,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,210 - INFO - Going to convert document batch...
2025-11-14 15:36:38,210 - 

Converted 'data\edgar_documents\AMT\4_2023-02-28' --> 'data\processed_data\AMT\4_2023-02-28.md'
Converted 'data\edgar_documents\AMT\4_2023-03-01' --> 'data\processed_data\AMT\4_2023-03-01.md'
Converted 'data\edgar_documents\AMT\4_2023-03-14' --> 'data\processed_data\AMT\4_2023-03-14.md'
Converted 'data\edgar_documents\AMT\4_2023-05-03' --> 'data\processed_data\AMT\4_2023-05-03.md'


2025-11-14 15:36:38,322 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,323 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:38,325 - INFO - Going to convert document batch...
2025-11-14 15:36:38,352 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,352 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AMT\4_2023-05-09: File format not allowed: data\edgar_documents\AMT\4_2023-05-09
Error processing data\edgar_documents\AMT\4_2023-05-10: File format not allowed: data\edgar_documents\AMT\4_2023-05-10
Error processing data\edgar_documents\AMT\4_2023-05-22: File format not allowed: data\edgar_documents\AMT\4_2023-05-22
Error processing data\edgar_documents\AMT\4_2023-05-23: File format not allowed: data\edgar_documents\AMT\4_2023-05-23
Converted 'data\edgar_documents\AMT\4_2023-05-24' --> 'data\processed_data\AMT\4_2023-05-24.md'


2025-11-14 15:36:38,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,532 - INFO - Going to convert document batch...
2025-11-14 15:36:38,532 - INFO - Processing document 4_2023-06-05
2025-11-14 15:36:38,549 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 15:36:38,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,588 - INFO - Going to convert document batch...
2025-11-14 15:36:38,589 - INFO - Processing document 4_2023-07-03
2025-11-14 15:36:38,606 - INFO - Finished converting document 4_2023-07-03 in 0.05 sec.
2025-11-14 15:36:38,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,646 - INFO - Going to convert document batch...
2025-11-14 15:36:38,646 - INFO - Processing document 4_2023-08-03
2025-11-14 15:36:38,663 - INFO - Finished converting document 4_2023-08-03 in 0.03 sec.
2025-11-14 15:36:38,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMT\4_2023-06-05' --> 'data\processed_data\AMT\4_2023-06-05.md'
Converted 'data\edgar_documents\AMT\4_2023-07-03' --> 'data\processed_data\AMT\4_2023-07-03.md'
Converted 'data\edgar_documents\AMT\4_2023-08-03' --> 'data\processed_data\AMT\4_2023-08-03.md'


2025-11-14 15:36:38,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,788 - INFO - Going to convert document batch...
2025-11-14 15:36:38,789 - INFO - Processing document 4_2023-08-14
2025-11-14 15:36:38,806 - INFO - Finished converting document 4_2023-08-14 in 0.03 sec.
2025-11-14 15:36:38,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,843 - INFO - Going to convert document batch...
2025-11-14 15:36:38,843 - INFO - Processing document 4_2023-08-17
2025-11-14 15:36:38,861 - INFO - Finished converting document 4_2023-08-17 in 0.03 sec.
2025-11-14 15:36:38,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,902 - INFO - Going to convert document batch...
2025-11-14 15:36:38,902 - INFO - Processing document 4_2023-08-21
2025-11-14 15:36:38,924 - INFO - Finished converting document 4_2023-08-21 in 0.05 sec.
2025-11-14 15:36:38,967 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AMT\4_2023-08-07' --> 'data\processed_data\AMT\4_2023-08-07.md'
Converted 'data\edgar_documents\AMT\4_2023-08-14' --> 'data\processed_data\AMT\4_2023-08-14.md'
Converted 'data\edgar_documents\AMT\4_2023-08-17' --> 'data\processed_data\AMT\4_2023-08-17.md'
Converted 'data\edgar_documents\AMT\4_2023-08-21' --> 'data\processed_data\AMT\4_2023-08-21.md'


2025-11-14 15:36:38,968 - ERROR - Input document 4_2023-09-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:38,969 - INFO - Going to convert document batch...
2025-11-14 15:36:38,993 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,994 - ERROR - Input document 4_2023-09-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AMT\4_2023-09-12: File format not allowed: data\edgar_documents\AMT\4_2023-09-12
Error processing data\edgar_documents\AMT\4_2023-09-13: File format not allowed: data\edgar_documents\AMT\4_2023-09-13
Converted 'data\edgar_documents\AMT\4_2023-10-04' --> 'data\processed_data\AMT\4_2023-10-04.md'
Converted 'data\edgar_documents\AMT\4_2023-10-18' --> 'data\processed_data\AMT\4_2023-10-18.md'
Error processing data\edgar_documents\AMT\4_2023-10-27: File format not allowed: data\edgar_documents\AMT\4_2023-10-27


2025-11-14 15:36:39,168 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:36:39,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,208 - INFO - Going to convert document batch...
2025-11-14 15:36:39,209 - INFO - Processing document 4_2024-02-28
2025-11-14 15:36:39,228 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 15:36:39,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,266 - INFO - Going to convert document batch...
2025-11-14 15:36:39,267 - INFO - Processing document 4_2024-03-01
2025-11-14 15:36:39,286 - INFO - Finished converting document 4_2024-03-01 in 0.03 sec.
2025-11-14 15:36:39,329 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:39,330 - ERROR - Input document 4_2024-03-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\AMT\4_2023-11-13' --> 'data\processed_data\AMT\4_2023-11-13.md'
Converted 'data\edgar_documents\AMT\4_2024-02-28' --> 'data\processed_data\AMT\4_2024-02-28.md'
Converted 'data\edgar_documents\AMT\4_2024-03-01' --> 'data\processed_data\AMT\4_2024-03-01.md'
Error processing data\edgar_documents\AMT\4_2024-03-04: File format not allowed: data\edgar_documents\AMT\4_2024-03-04


2025-11-14 15:36:39,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,414 - INFO - Going to convert document batch...
2025-11-14 15:36:39,415 - INFO - Processing document 4_2024-03-06
2025-11-14 15:36:39,439 - INFO - Finished converting document 4_2024-03-06 in 0.05 sec.
2025-11-14 15:36:39,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,481 - INFO - Going to convert document batch...
2025-11-14 15:36:39,482 - INFO - Processing document 4_2024-03-08
2025-11-14 15:36:39,505 - INFO - Finished converting document 4_2024-03-08 in 0.05 sec.
2025-11-14 15:36:39,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,545 - INFO - Going to convert document batch...
2025-11-14 15:36:39,545 - INFO - Processing document 4_2024-03-12
2025-11-14 15:36:39,562 - INFO - Finished converting document 4_2024-03-12 in 0.03 sec.


Converted 'data\edgar_documents\AMT\4_2024-03-05' --> 'data\processed_data\AMT\4_2024-03-05.md'
Converted 'data\edgar_documents\AMT\4_2024-03-06' --> 'data\processed_data\AMT\4_2024-03-06.md'
Converted 'data\edgar_documents\AMT\4_2024-03-08' --> 'data\processed_data\AMT\4_2024-03-08.md'
Converted 'data\edgar_documents\AMT\4_2024-03-12' --> 'data\processed_data\AMT\4_2024-03-12.md'


2025-11-14 15:36:39,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,619 - INFO - Going to convert document batch...
2025-11-14 15:36:39,619 - INFO - Processing document 4_2024-03-19
2025-11-14 15:36:39,640 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 15:36:39,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,679 - INFO - Going to convert document batch...
2025-11-14 15:36:39,680 - INFO - Processing document 4_2024-05-03
2025-11-14 15:36:39,696 - INFO - Finished converting document 4_2024-05-03 in 0.03 sec.
2025-11-14 15:36:39,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,734 - INFO - Going to convert document batch...
2025-11-14 15:36:39,735 - INFO - Processing document 4_2024-05-07
2025-11-14 15:36:39,751 - INFO - Finished converting document 4_2024-05-07 in 0.03 sec.
2025-11-14 15:36:39,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMT\4_2024-03-19' --> 'data\processed_data\AMT\4_2024-03-19.md'
Converted 'data\edgar_documents\AMT\4_2024-05-03' --> 'data\processed_data\AMT\4_2024-05-03.md'
Converted 'data\edgar_documents\AMT\4_2024-05-07' --> 'data\processed_data\AMT\4_2024-05-07.md'
Converted 'data\edgar_documents\AMT\4_2024-05-22' --> 'data\processed_data\AMT\4_2024-05-22.md'


2025-11-14 15:36:39,862 - ERROR - Input document 4_2024-05-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:39,863 - INFO - Going to convert document batch...
2025-11-14 15:36:39,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,883 - INFO - Going to convert document batch...
2025-11-14 15:36:39,884 - INFO - Processing document 4_2024-06-04
2025-11-14 15:36:39,901 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 15:36:39,934 - INFO - detec

Error processing data\edgar_documents\AMT\4_2024-05-23: File format not allowed: data\edgar_documents\AMT\4_2024-05-23
Converted 'data\edgar_documents\AMT\4_2024-06-04' --> 'data\processed_data\AMT\4_2024-06-04.md'
Converted 'data\edgar_documents\AMT\4_2024-06-06' --> 'data\processed_data\AMT\4_2024-06-06.md'
Converted 'data\edgar_documents\AMT\4_2024-08-06' --> 'data\processed_data\AMT\4_2024-08-06.md'


2025-11-14 15:36:40,072 - INFO - Going to convert document batch...
2025-11-14 15:36:40,073 - INFO - Processing document 4_2024-08-28
2025-11-14 15:36:40,094 - INFO - Finished converting document 4_2024-08-28 in 0.05 sec.
2025-11-14 15:36:40,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,174 - INFO - Going to convert document batch...
2025-11-14 15:36:40,175 - INFO - Processing document 4_2024-09-05
2025-11-14 15:36:40,216 - INFO - Finished converting document 4_2024-09-05 in 0.09 sec.
2025-11-14 15:36:40,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,273 - INFO - Going to convert document batch...
2025-11-14 15:36:40,274 - INFO - Processing document 4_2024-09-12
2025-11-14 15:36:40,295 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.


Converted 'data\edgar_documents\AMT\4_2024-08-28' --> 'data\processed_data\AMT\4_2024-08-28.md'
Converted 'data\edgar_documents\AMT\4_2024-09-05' --> 'data\processed_data\AMT\4_2024-09-05.md'


2025-11-14 15:36:40,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,335 - INFO - Going to convert document batch...
2025-11-14 15:36:40,336 - INFO - Processing document 4_2024-09-17
2025-11-14 15:36:40,353 - INFO - Finished converting document 4_2024-09-17 in 0.03 sec.
2025-11-14 15:36:40,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,392 - INFO - Going to convert document batch...
2025-11-14 15:36:40,393 - INFO - Processing document 4_2024-10-03
2025-11-14 15:36:40,410 - INFO - Finished converting document 4_2024-10-03 in 0.03 sec.
2025-11-14 15:36:40,451 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:40,452 - ERROR - Input document 4_2024-11-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\AMT\4_2024-09-12' --> 'data\processed_data\AMT\4_2024-09-12.md'
Converted 'data\edgar_documents\AMT\4_2024-09-17' --> 'data\processed_data\AMT\4_2024-09-17.md'
Converted 'data\edgar_documents\AMT\4_2024-10-03' --> 'data\processed_data\AMT\4_2024-10-03.md'
Error processing data\edgar_documents\AMT\4_2024-11-18: File format not allowed: data\edgar_documents\AMT\4_2024-11-18
Error processing data\edgar_documents\AMT\4_2024-11-19: File format not allowed: data\edgar_documents\AMT\4_2024-11-19


2025-11-14 15:36:40,503 - INFO - Going to convert document batch...
2025-11-14 15:36:40,504 - INFO - Processing document 4_2025-01-07
2025-11-14 15:36:40,524 - INFO - Finished converting document 4_2025-01-07 in 0.03 sec.
2025-11-14 15:36:40,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,565 - INFO - Going to convert document batch...
2025-11-14 15:36:40,566 - INFO - Processing document 4_2025-01-17
2025-11-14 15:36:40,591 - INFO - Finished converting document 4_2025-01-17 in 0.05 sec.
2025-11-14 15:36:40,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,638 - INFO - Going to convert document batch...
2025-11-14 15:36:40,639 - INFO - Processing document 4_2025-02-18
2025-11-14 15:36:40,661 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:36:40,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,701 - INFO - Going to convert document batch...
2025-11-14 15:36:40,702 - 

Converted 'data\edgar_documents\AMT\4_2025-01-07' --> 'data\processed_data\AMT\4_2025-01-07.md'
Converted 'data\edgar_documents\AMT\4_2025-01-17' --> 'data\processed_data\AMT\4_2025-01-17.md'
Converted 'data\edgar_documents\AMT\4_2025-02-18' --> 'data\processed_data\AMT\4_2025-02-18.md'


2025-11-14 15:36:40,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,758 - INFO - Going to convert document batch...
2025-11-14 15:36:40,759 - INFO - Processing document 4_2025-03-03
2025-11-14 15:36:40,776 - INFO - Finished converting document 4_2025-03-03 in 0.05 sec.
2025-11-14 15:36:40,821 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:40,822 - ERROR - Input document 4_2025-03-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36

Converted 'data\edgar_documents\AMT\4_2025-02-28' --> 'data\processed_data\AMT\4_2025-02-28.md'
Converted 'data\edgar_documents\AMT\4_2025-03-03' --> 'data\processed_data\AMT\4_2025-03-03.md'
Error processing data\edgar_documents\AMT\4_2025-03-11: File format not allowed: data\edgar_documents\AMT\4_2025-03-11
Converted 'data\edgar_documents\AMT\4_2025-03-12' --> 'data\processed_data\AMT\4_2025-03-12.md'


2025-11-14 15:36:40,927 - INFO - Finished converting document 4_2025-03-19 in 0.03 sec.
2025-11-14 15:36:40,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,978 - INFO - Going to convert document batch...
2025-11-14 15:36:40,980 - INFO - Processing document 4_2025-04-02
2025-11-14 15:36:41,008 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 15:36:41,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,056 - INFO - Going to convert document batch...
2025-11-14 15:36:41,057 - INFO - Processing document 4_2025-05-16
2025-11-14 15:36:41,075 - INFO - Finished converting document 4_2025-05-16 in 0.05 sec.


Converted 'data\edgar_documents\AMT\4_2025-03-19' --> 'data\processed_data\AMT\4_2025-03-19.md'
Converted 'data\edgar_documents\AMT\4_2025-04-02' --> 'data\processed_data\AMT\4_2025-04-02.md'
Converted 'data\edgar_documents\AMT\4_2025-05-16' --> 'data\processed_data\AMT\4_2025-05-16.md'


2025-11-14 15:36:41,132 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:41,132 - ERROR - Input document 4_2025-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:41,134 - INFO - Going to convert document batch...
2025-11-14 15:36:41,160 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:41,161 - ERROR - Input document 4_2025-05-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AMT\4_2025-05-21: File format not allowed: data\edgar_documents\AMT\4_2025-05-21
Error processing data\edgar_documents\AMT\4_2025-05-22: File format not allowed: data\edgar_documents\AMT\4_2025-05-22
Converted 'data\edgar_documents\AMT\4_2025-06-03' --> 'data\processed_data\AMT\4_2025-06-03.md'
Converted 'data\edgar_documents\AMT\4_2025-08-01' --> 'data\processed_data\AMT\4_2025-08-01.md'
Error processing data\edgar_documents\AMT\4_2025-09-11: File format not allowed: data\edgar_documents\AMT\4_2025-09-11


2025-11-14 15:36:41,334 - ERROR - Input document 4_2025-09-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:41,336 - INFO - Going to convert document batch...
2025-11-14 15:36:41,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,357 - INFO - Going to convert document batch...
2025-11-14 15:36:41,358 - INFO - Processing document 4_2025-09-23
2025-11-14 15:36:41,377 - INFO - Finished converting document 4_2025-09-23 in 0.05 sec.
2025-11-14 15:36:41,408 - INFO - detec

Error processing data\edgar_documents\AMT\4_2025-09-12: File format not allowed: data\edgar_documents\AMT\4_2025-09-12
Converted 'data\edgar_documents\AMT\4_2025-09-23' --> 'data\processed_data\AMT\4_2025-09-23.md'
Converted 'data\edgar_documents\AMT\4_2025-10-03' --> 'data\processed_data\AMT\4_2025-10-03.md'


2025-11-14 15:36:41,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,551 - INFO - Going to convert document batch...
2025-11-14 15:36:41,552 - INFO - Processing document 8-K_2023-02-23
2025-11-14 15:36:41,572 - INFO - Finished converting document 8-K_2023-02-23 in 0.05 sec.
2025-11-14 15:36:41,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,612 - INFO - Going to convert document batch...
2025-11-14 15:36:41,613 - INFO - Processing document 8-K_2023-03-01
2025-11-14 15:36:41,634 - INFO - Finished converting document 8-K_2023-03-01 in 0.05 sec.
2025-11-14 15:36:41,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,676 - INFO - Going to convert document batch...
2025-11-14 15:36:41,677 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:36:41,699 - INFO - Finished converting document 8-K_2023-03-02 in 0.06 sec.


Converted 'data\edgar_documents\AMT\4_2025-11-04' --> 'data\processed_data\AMT\4_2025-11-04.md'
Converted 'data\edgar_documents\AMT\8-K_2023-02-23' --> 'data\processed_data\AMT\8-K_2023-02-23.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-01' --> 'data\processed_data\AMT\8-K_2023-03-01.md'


2025-11-14 15:36:41,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,744 - INFO - Going to convert document batch...
2025-11-14 15:36:41,745 - INFO - Processing document 8-K_2023-03-03
2025-11-14 15:36:41,769 - INFO - Finished converting document 8-K_2023-03-03 in 0.05 sec.
2025-11-14 15:36:41,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,811 - INFO - Going to convert document batch...
2025-11-14 15:36:41,812 - INFO - Processing document 8-K_2023-03-08
2025-11-14 15:36:41,832 - INFO - Finished converting document 8-K_2023-03-08 in 0.05 sec.
2025-11-14 15:36:41,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,873 - INFO - Going to convert document batch...
2025-11-14 15:36:41,874 - INFO - Processing document 8-K_2023-03-09
2025-11-14 15:36:41,896 - INFO - Finished converting document 8-K_2023-03-09 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-03-02' --> 'data\processed_data\AMT\8-K_2023-03-02.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-03' --> 'data\processed_data\AMT\8-K_2023-03-03.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-08' --> 'data\processed_data\AMT\8-K_2023-03-08.md'


2025-11-14 15:36:41,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,938 - INFO - Going to convert document batch...
2025-11-14 15:36:41,939 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:36:41,960 - INFO - Finished converting document 8-K_2023-03-13 in 0.05 sec.
2025-11-14 15:36:41,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,998 - INFO - Going to convert document batch...
2025-11-14 15:36:41,999 - INFO - Processing document 8-K_2023-03-31
2025-11-14 15:36:42,017 - INFO - Finished converting document 8-K_2023-03-31 in 0.05 sec.
2025-11-14 15:36:42,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,056 - INFO - Going to convert document batch...
2025-11-14 15:36:42,057 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:36:42,078 - INFO - Finished converting document 8-K_2023-04-26 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-03-09' --> 'data\processed_data\AMT\8-K_2023-03-09.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-13' --> 'data\processed_data\AMT\8-K_2023-03-13.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-31' --> 'data\processed_data\AMT\8-K_2023-03-31.md'
Converted 'data\edgar_documents\AMT\8-K_2023-04-26' --> 'data\processed_data\AMT\8-K_2023-04-26.md'


2025-11-14 15:36:42,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,143 - INFO - Going to convert document batch...
2025-11-14 15:36:42,144 - INFO - Processing document 8-K_2023-05-09
2025-11-14 15:36:42,164 - INFO - Finished converting document 8-K_2023-05-09 in 0.06 sec.
2025-11-14 15:36:42,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,203 - INFO - Going to convert document batch...
2025-11-14 15:36:42,205 - INFO - Processing document 8-K_2023-05-16
2025-11-14 15:36:42,226 - INFO - Finished converting document 8-K_2023-05-16 in 0.05 sec.
2025-11-14 15:36:42,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,266 - INFO - Going to convert document batch...
2025-11-14 15:36:42,267 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:36:42,288 - INFO - Finished converting document 8-K_2023-05-22 in 0.05 sec.
2025-11-14 15:36:42,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\AMT\8-K_2023-05-09' --> 'data\processed_data\AMT\8-K_2023-05-09.md'
Converted 'data\edgar_documents\AMT\8-K_2023-05-16' --> 'data\processed_data\AMT\8-K_2023-05-16.md'
Converted 'data\edgar_documents\AMT\8-K_2023-05-22' --> 'data\processed_data\AMT\8-K_2023-05-22.md'


2025-11-14 15:36:42,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,980 - INFO - Going to convert document batch...
2025-11-14 15:36:42,981 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:36:43,003 - INFO - Finished converting document 8-K_2023-06-29 in 0.17 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-05-25' --> 'data\processed_data\AMT\8-K_2023-05-25.md'


2025-11-14 15:36:43,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,044 - INFO - Going to convert document batch...
2025-11-14 15:36:43,045 - INFO - Processing document 8-K_2023-07-20
2025-11-14 15:36:43,067 - INFO - Finished converting document 8-K_2023-07-20 in 0.05 sec.
2025-11-14 15:36:43,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,180 - INFO - Going to convert document batch...
2025-11-14 15:36:43,181 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:36:43,201 - INFO - Finished converting document 8-K_2023-07-27 in 0.12 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-06-29' --> 'data\processed_data\AMT\8-K_2023-06-29.md'
Converted 'data\edgar_documents\AMT\8-K_2023-07-20' --> 'data\processed_data\AMT\8-K_2023-07-20.md'


2025-11-14 15:36:43,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,243 - INFO - Going to convert document batch...
2025-11-14 15:36:43,243 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:36:43,266 - INFO - Finished converting document 8-K_2023-09-12 in 0.05 sec.
2025-11-14 15:36:43,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,306 - INFO - Going to convert document batch...
2025-11-14 15:36:43,306 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:36:43,330 - INFO - Finished converting document 8-K_2023-09-15 in 0.05 sec.
2025-11-14 15:36:43,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,370 - INFO - Going to convert document batch...
2025-11-14 15:36:43,371 - INFO - Processing document 8-K_2023-09-20
2025-11-14 15:36:43,392 - INFO - Finished converting document 8-K_2023-09-20 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-07-27' --> 'data\processed_data\AMT\8-K_2023-07-27.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-12' --> 'data\processed_data\AMT\8-K_2023-09-12.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-15' --> 'data\processed_data\AMT\8-K_2023-09-15.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-20' --> 'data\processed_data\AMT\8-K_2023-09-20.md'


2025-11-14 15:36:43,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,454 - INFO - Going to convert document batch...
2025-11-14 15:36:43,455 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:36:43,487 - INFO - Finished converting document 8-K_2023-10-26 in 0.08 sec.
2025-11-14 15:36:43,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,539 - INFO - Going to convert document batch...
2025-11-14 15:36:43,540 - INFO - Processing document 8-K_2023-12-14
2025-11-14 15:36:43,564 - INFO - Finished converting document 8-K_2023-12-14 in 0.06 sec.
2025-11-14 15:36:43,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,606 - INFO - Going to convert document batch...
2025-11-14 15:36:43,607 - INFO - Processing document 8-K_2024-01-05
2025-11-14 15:36:43,630 - INFO - Finished converting document 8-K_2024-01-05 in 0.05 sec.
2025-11-14 15:36:43,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\AMT\8-K_2023-10-26' --> 'data\processed_data\AMT\8-K_2023-10-26.md'
Converted 'data\edgar_documents\AMT\8-K_2023-12-14' --> 'data\processed_data\AMT\8-K_2023-12-14.md'
Converted 'data\edgar_documents\AMT\8-K_2024-01-05' --> 'data\processed_data\AMT\8-K_2024-01-05.md'


2025-11-14 15:36:43,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,733 - INFO - Going to convert document batch...
2025-11-14 15:36:43,734 - INFO - Processing document 8-K_2024-02-27
2025-11-14 15:36:43,757 - INFO - Finished converting document 8-K_2024-02-27 in 0.05 sec.
2025-11-14 15:36:43,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,794 - INFO - Going to convert document batch...
2025-11-14 15:36:43,795 - INFO - Processing document 8-K_2024-03-01
2025-11-14 15:36:43,819 - INFO - Finished converting document 8-K_2024-03-01 in 0.05 sec.
2025-11-14 15:36:43,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,858 - INFO - Going to convert document batch...
2025-11-14 15:36:43,859 - INFO - Processing document 8-K_2024-03-04
2025-11-14 15:36:43,882 - INFO - Finished converting document 8-K_2024-03-04 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-02-07' --> 'data\processed_data\AMT\8-K_2024-02-07.md'
Converted 'data\edgar_documents\AMT\8-K_2024-02-27' --> 'data\processed_data\AMT\8-K_2024-02-27.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-01' --> 'data\processed_data\AMT\8-K_2024-03-01.md'


2025-11-14 15:36:43,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,923 - INFO - Going to convert document batch...
2025-11-14 15:36:43,923 - INFO - Processing document 8-K_2024-03-07
2025-11-14 15:36:43,949 - INFO - Finished converting document 8-K_2024-03-07 in 0.06 sec.
2025-11-14 15:36:43,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,988 - INFO - Going to convert document batch...
2025-11-14 15:36:43,989 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:36:44,014 - INFO - Finished converting document 8-K_2024-03-14 in 0.06 sec.
2025-11-14 15:36:44,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,055 - INFO - Going to convert document batch...
2025-11-14 15:36:44,056 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:36:44,079 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-03-04' --> 'data\processed_data\AMT\8-K_2024-03-04.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-07' --> 'data\processed_data\AMT\8-K_2024-03-07.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-14' --> 'data\processed_data\AMT\8-K_2024-03-14.md'


2025-11-14 15:36:44,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,115 - INFO - Going to convert document batch...
2025-11-14 15:36:44,116 - INFO - Processing document 8-K_2024-05-22
2025-11-14 15:36:44,140 - INFO - Finished converting document 8-K_2024-05-22 in 0.05 sec.
2025-11-14 15:36:44,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,184 - INFO - Going to convert document batch...
2025-11-14 15:36:44,185 - INFO - Processing document 8-K_2024-05-24
2025-11-14 15:36:44,220 - INFO - Finished converting document 8-K_2024-05-24 in 0.06 sec.
2025-11-14 15:36:44,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,268 - INFO - Going to convert document batch...
2025-11-14 15:36:44,268 - INFO - Processing document 8-K_2024-05-29
2025-11-14 15:36:44,291 - INFO - Finished converting document 8-K_2024-05-29 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-04-30' --> 'data\processed_data\AMT\8-K_2024-04-30.md'
Converted 'data\edgar_documents\AMT\8-K_2024-05-22' --> 'data\processed_data\AMT\8-K_2024-05-22.md'
Converted 'data\edgar_documents\AMT\8-K_2024-05-24' --> 'data\processed_data\AMT\8-K_2024-05-24.md'


2025-11-14 15:36:44,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,331 - INFO - Going to convert document batch...
2025-11-14 15:36:44,332 - INFO - Processing document 8-K_2024-07-30
2025-11-14 15:36:44,358 - INFO - Finished converting document 8-K_2024-07-30 in 0.06 sec.
2025-11-14 15:36:44,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,397 - INFO - Going to convert document batch...
2025-11-14 15:36:44,397 - INFO - Processing document 8-K_2024-09-12
2025-11-14 15:36:44,418 - INFO - Finished converting document 8-K_2024-09-12 in 0.06 sec.
2025-11-14 15:36:44,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,459 - INFO - Going to convert document batch...
2025-11-14 15:36:44,460 - INFO - Processing document 8-K_2024-10-29
2025-11-14 15:36:44,482 - INFO - Finished converting document 8-K_2024-10-29 in 0.06 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-05-29' --> 'data\processed_data\AMT\8-K_2024-05-29.md'
Converted 'data\edgar_documents\AMT\8-K_2024-07-30' --> 'data\processed_data\AMT\8-K_2024-07-30.md'
Converted 'data\edgar_documents\AMT\8-K_2024-09-12' --> 'data\processed_data\AMT\8-K_2024-09-12.md'


2025-11-14 15:36:44,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,522 - INFO - Going to convert document batch...
2025-11-14 15:36:44,523 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:36:44,543 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 15:36:44,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,580 - INFO - Going to convert document batch...
2025-11-14 15:36:44,580 - INFO - Processing document 8-K_2024-11-19
2025-11-14 15:36:44,604 - INFO - Finished converting document 8-K_2024-11-19 in 0.05 sec.
2025-11-14 15:36:44,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,646 - INFO - Going to convert document batch...
2025-11-14 15:36:44,647 - INFO - Processing document 8-K_2024-11-21
2025-11-14 15:36:44,673 - INFO - Finished converting document 8-K_2024-11-21 in 0.06 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-10-29' --> 'data\processed_data\AMT\8-K_2024-10-29.md'
Converted 'data\edgar_documents\AMT\8-K_2024-10-31' --> 'data\processed_data\AMT\8-K_2024-10-31.md'
Converted 'data\edgar_documents\AMT\8-K_2024-11-19' --> 'data\processed_data\AMT\8-K_2024-11-19.md'


2025-11-14 15:36:44,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,712 - INFO - Going to convert document batch...
2025-11-14 15:36:44,712 - INFO - Processing document 8-K_2024-12-05
2025-11-14 15:36:44,740 - INFO - Finished converting document 8-K_2024-12-05 in 0.05 sec.
2025-11-14 15:36:44,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,801 - INFO - Going to convert document batch...
2025-11-14 15:36:44,804 - INFO - Processing document 8-K_2025-01-07
2025-11-14 15:36:44,855 - INFO - Finished converting document 8-K_2025-01-07 in 0.11 sec.
2025-11-14 15:36:44,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2024-11-21' --> 'data\processed_data\AMT\8-K_2024-11-21.md'
Converted 'data\edgar_documents\AMT\8-K_2024-12-05' --> 'data\processed_data\AMT\8-K_2024-12-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-01-07' --> 'data\processed_data\AMT\8-K_2025-01-07.md'


2025-11-14 15:36:44,902 - INFO - Going to convert document batch...
2025-11-14 15:36:44,904 - INFO - Processing document 8-K_2025-01-28
2025-11-14 15:36:44,925 - INFO - Finished converting document 8-K_2025-01-28 in 0.06 sec.
2025-11-14 15:36:44,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,960 - INFO - Going to convert document batch...
2025-11-14 15:36:44,960 - INFO - Processing document 8-K_2025-02-05
2025-11-14 15:36:44,993 - INFO - Finished converting document 8-K_2025-02-05 in 0.05 sec.
2025-11-14 15:36:45,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,033 - INFO - Going to convert document batch...
2025-11-14 15:36:45,033 - INFO - Processing document 8-K_2025-02-25
2025-11-14 15:36:45,056 - INFO - Finished converting document 8-K_2025-02-25 in 0.05 sec.
2025-11-14 15:36:45,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,094 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AMT\8-K_2025-01-28' --> 'data\processed_data\AMT\8-K_2025-01-28.md'
Converted 'data\edgar_documents\AMT\8-K_2025-02-05' --> 'data\processed_data\AMT\8-K_2025-02-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-02-25' --> 'data\processed_data\AMT\8-K_2025-02-25.md'


2025-11-14 15:36:45,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,162 - INFO - Going to convert document batch...
2025-11-14 15:36:45,163 - INFO - Processing document 8-K_2025-03-06
2025-11-14 15:36:45,189 - INFO - Finished converting document 8-K_2025-03-06 in 0.06 sec.
2025-11-14 15:36:45,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,226 - INFO - Going to convert document batch...
2025-11-14 15:36:45,227 - INFO - Processing document 8-K_2025-03-11
2025-11-14 15:36:45,248 - INFO - Finished converting document 8-K_2025-03-11 in 0.05 sec.
2025-11-14 15:36:45,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,288 - INFO - Going to convert document batch...
2025-11-14 15:36:45,288 - INFO - Processing document 8-K_2025-03-14


Converted 'data\edgar_documents\AMT\8-K_2025-03-05' --> 'data\processed_data\AMT\8-K_2025-03-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-06' --> 'data\processed_data\AMT\8-K_2025-03-06.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-11' --> 'data\processed_data\AMT\8-K_2025-03-11.md'


2025-11-14 15:36:45,314 - INFO - Finished converting document 8-K_2025-03-14 in 0.06 sec.
2025-11-14 15:36:45,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,355 - INFO - Going to convert document batch...
2025-11-14 15:36:45,355 - INFO - Processing document 8-K_2025-03-20
2025-11-14 15:36:45,374 - INFO - Finished converting document 8-K_2025-03-20 in 0.05 sec.
2025-11-14 15:36:45,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,410 - INFO - Going to convert document batch...
2025-11-14 15:36:45,411 - INFO - Processing document 8-K_2025-04-29
2025-11-14 15:36:45,433 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 15:36:45,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,479 - INFO - Going to convert document batch...
2025-11-14 15:36:45,481 - INFO - Processing document 8-K_2025-05-15


Converted 'data\edgar_documents\AMT\8-K_2025-03-14' --> 'data\processed_data\AMT\8-K_2025-03-14.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-20' --> 'data\processed_data\AMT\8-K_2025-03-20.md'
Converted 'data\edgar_documents\AMT\8-K_2025-04-29' --> 'data\processed_data\AMT\8-K_2025-04-29.md'


2025-11-14 15:36:45,524 - INFO - Finished converting document 8-K_2025-05-15 in 0.08 sec.
2025-11-14 15:36:45,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,601 - INFO - Going to convert document batch...
2025-11-14 15:36:45,603 - INFO - Processing document 8-K_2025-05-21
2025-11-14 15:36:45,633 - INFO - Finished converting document 8-K_2025-05-21 in 0.08 sec.
2025-11-14 15:36:45,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,679 - INFO - Going to convert document batch...
2025-11-14 15:36:45,679 - INFO - Processing document 8-K_2025-05-30
2025-11-14 15:36:45,701 - INFO - Finished converting document 8-K_2025-05-30 in 0.06 sec.
2025-11-14 15:36:45,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,741 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMT\8-K_2025-05-15' --> 'data\processed_data\AMT\8-K_2025-05-15.md'
Converted 'data\edgar_documents\AMT\8-K_2025-05-21' --> 'data\processed_data\AMT\8-K_2025-05-21.md'
Converted 'data\edgar_documents\AMT\8-K_2025-05-30' --> 'data\processed_data\AMT\8-K_2025-05-30.md'


2025-11-14 15:36:45,742 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:36:45,764 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 15:36:45,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2025-07-29' --> 'data\processed_data\AMT\8-K_2025-07-29.md'


2025-11-14 15:36:46,041 - INFO - Going to convert document batch...
2025-11-14 15:36:46,042 - INFO - Processing document 8-K_2025-08-25
2025-11-14 15:36:46,066 - INFO - Finished converting document 8-K_2025-08-25 in 0.28 sec.
2025-11-14 15:36:46,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,105 - INFO - Going to convert document batch...
2025-11-14 15:36:46,106 - INFO - Processing document 8-K_2025-09-05
2025-11-14 15:36:46,125 - INFO - Finished converting document 8-K_2025-09-05 in 0.05 sec.
2025-11-14 15:36:46,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,185 - INFO - Going to convert document batch...
2025-11-14 15:36:46,186 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:36:46,207 - INFO - Finished converting document 8-K_2025-09-11 in 0.06 sec.
2025-11-14 15:36:46,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,248 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AMT\8-K_2025-08-25' --> 'data\processed_data\AMT\8-K_2025-08-25.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-05' --> 'data\processed_data\AMT\8-K_2025-09-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-11' --> 'data\processed_data\AMT\8-K_2025-09-11.md'


2025-11-14 15:36:46,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,311 - INFO - Going to convert document batch...
2025-11-14 15:36:46,312 - INFO - Processing document 8-K_2025-09-18
2025-11-14 15:36:46,349 - INFO - Finished converting document 8-K_2025-09-18 in 0.06 sec.
2025-11-14 15:36:46,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,395 - INFO - Going to convert document batch...
2025-11-14 15:36:46,396 - INFO - Processing document 8-K_2025-09-24
2025-11-14 15:36:46,414 - INFO - Finished converting document 8-K_2025-09-24 in 0.05 sec.
2025-11-14 15:36:46,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,450 - INFO - Going to convert document batch...
2025-11-14 15:36:46,450 - INFO - Processing document 8-K_2025-10-28
2025-11-14 15:36:46,471 - INFO - Finished converting document 8-K_2025-10-28 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2025-09-16' --> 'data\processed_data\AMT\8-K_2025-09-16.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-18' --> 'data\processed_data\AMT\8-K_2025-09-18.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-24' --> 'data\processed_data\AMT\8-K_2025-09-24.md'


2025-11-14 15:36:46,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,508 - INFO - Going to convert document batch...
2025-11-14 15:36:46,509 - INFO - Processing document 8-K_2025-11-07
2025-11-14 15:36:46,527 - INFO - Finished converting document 8-K_2025-11-07 in 0.05 sec.
2025-11-14 15:36:46,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2025-10-28' --> 'data\processed_data\AMT\8-K_2025-10-28.md'
Converted 'data\edgar_documents\AMT\8-K_2025-11-07' --> 'data\processed_data\AMT\8-K_2025-11-07.md'


2025-11-14 15:36:46,982 - INFO - Going to convert document batch...
2025-11-14 15:36:46,983 - INFO - Processing document DEF-14A_2023-04-12
2025-11-14 15:36:48,897 - INFO - Finished converting document DEF-14A_2023-04-12 in 2.36 sec.
2025-11-14 15:36:49,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2023-04-12' --> 'data\processed_data\AMT\DEF-14A_2023-04-12.md'


2025-11-14 15:36:50,145 - INFO - Going to convert document batch...
2025-11-14 15:36:50,146 - INFO - Processing document DEF-14A_2024-04-10
2025-11-14 15:36:52,019 - INFO - Finished converting document DEF-14A_2024-04-10 in 2.33 sec.
2025-11-14 15:36:52,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2024-04-10' --> 'data\processed_data\AMT\DEF-14A_2024-04-10.md'


2025-11-14 15:36:53,655 - INFO - Going to convert document batch...
2025-11-14 15:36:53,656 - INFO - Processing document DEF-14A_2025-04-02
2025-11-14 15:36:56,890 - INFO - Finished converting document DEF-14A_2025-04-02 in 4.08 sec.
2025-11-14 15:36:58,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2025-04-02' --> 'data\processed_data\AMT\DEF-14A_2025-04-02.md'
Processed 130 new files. Errors: 16
Found 169 files to process in data\edgar_documents\AMZN


2025-11-14 15:36:59,170 - INFO - Going to convert document batch...
2025-11-14 15:36:59,170 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:36:59,170 - INFO - Processing document 10-K_2023-02-03
2025-11-14 15:37:00,025 - INFO - Finished converting document 10-K_2023-02-03 in 1.56 sec.
2025-11-14 15:37:00,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2023-02-03' --> 'data\processed_data\AMZN\10-K_2023-02-03.md'


2025-11-14 15:37:01,007 - INFO - Going to convert document batch...
2025-11-14 15:37:01,007 - INFO - Processing document 10-K_2024-02-02
2025-11-14 15:37:01,888 - INFO - Finished converting document 10-K_2024-02-02 in 1.52 sec.
2025-11-14 15:37:02,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2024-02-02' --> 'data\processed_data\AMZN\10-K_2024-02-02.md'


2025-11-14 15:37:02,670 - INFO - Going to convert document batch...
2025-11-14 15:37:02,670 - INFO - Processing document 10-K_2025-02-07
2025-11-14 15:37:03,548 - INFO - Finished converting document 10-K_2025-02-07 in 1.30 sec.
2025-11-14 15:37:03,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2025-02-07' --> 'data\processed_data\AMZN\10-K_2025-02-07.md'


2025-11-14 15:37:04,506 - INFO - Going to convert document batch...
2025-11-14 15:37:04,507 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:37:04,953 - INFO - Finished converting document 10-Q_2023-04-28 in 1.05 sec.
2025-11-14 15:37:05,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-04-28' --> 'data\processed_data\AMZN\10-Q_2023-04-28.md'


2025-11-14 15:37:05,491 - INFO - Going to convert document batch...
2025-11-14 15:37:05,492 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:37:06,023 - INFO - Finished converting document 10-Q_2023-08-04 in 0.83 sec.
2025-11-14 15:37:06,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-08-04' --> 'data\processed_data\AMZN\10-Q_2023-08-04.md'


2025-11-14 15:37:06,605 - INFO - Going to convert document batch...
2025-11-14 15:37:06,606 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:37:07,424 - INFO - Finished converting document 10-Q_2023-10-27 in 1.12 sec.
2025-11-14 15:37:07,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-10-27' --> 'data\processed_data\AMZN\10-Q_2023-10-27.md'


2025-11-14 15:37:07,999 - INFO - Going to convert document batch...
2025-11-14 15:37:07,999 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:37:08,508 - INFO - Finished converting document 10-Q_2024-05-01 in 0.80 sec.
2025-11-14 15:37:08,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-05-01' --> 'data\processed_data\AMZN\10-Q_2024-05-01.md'


2025-11-14 15:37:09,080 - INFO - Going to convert document batch...
2025-11-14 15:37:09,081 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 15:37:09,628 - INFO - Finished converting document 10-Q_2024-08-02 in 0.86 sec.
2025-11-14 15:37:09,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-08-02' --> 'data\processed_data\AMZN\10-Q_2024-08-02.md'


2025-11-14 15:37:10,587 - INFO - Going to convert document batch...
2025-11-14 15:37:10,588 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:37:11,147 - INFO - Finished converting document 10-Q_2024-11-01 in 1.22 sec.
2025-11-14 15:37:11,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-11-01' --> 'data\processed_data\AMZN\10-Q_2024-11-01.md'


2025-11-14 15:37:11,692 - INFO - Going to convert document batch...
2025-11-14 15:37:11,692 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:37:12,152 - INFO - Finished converting document 10-Q_2025-05-02 in 0.73 sec.
2025-11-14 15:37:12,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2025-05-02' --> 'data\processed_data\AMZN\10-Q_2025-05-02.md'


2025-11-14 15:37:12,999 - INFO - Going to convert document batch...
2025-11-14 15:37:12,999 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:37:13,583 - INFO - Finished converting document 10-Q_2025-08-01 in 1.19 sec.
2025-11-14 15:37:13,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2025-08-01' --> 'data\processed_data\AMZN\10-Q_2025-08-01.md'


2025-11-14 15:37:14,220 - INFO - Going to convert document batch...
2025-11-14 15:37:14,221 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:37:14,786 - INFO - Finished converting document 10-Q_2025-10-31 in 0.89 sec.
2025-11-14 15:37:15,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,088 - INFO - Going to convert document batch...
2025-11-14 15:37:15,089 - INFO - Processing document 4_2023-02-06
2025-11-14 15:37:15,124 - INFO - Finished converting document 4_2023-02-06 in 0.06 sec.
2025-11-14 15:37:15,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,232 - INFO - Going to convert document batch...
2025-11-14 15:37:15,233 - INFO - Processing document 4_2023-02-08
2025-11-14 15:37:15,251 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\10-Q_2025-10-31' --> 'data\processed_data\AMZN\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-06' --> 'data\processed_data\AMZN\4_2023-02-06.md'


2025-11-14 15:37:15,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,292 - INFO - Going to convert document batch...
2025-11-14 15:37:15,293 - INFO - Processing document 4_2023-02-17
2025-11-14 15:37:15,317 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 15:37:15,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,390 - INFO - Going to convert document batch...
2025-11-14 15:37:15,391 - INFO - Processing document 4_2023-02-23
2025-11-14 15:37:15,416 - INFO - Finished converting document 4_2023-02-23 in 0.06 sec.
2025-11-14 15:37:15,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-02-08' --> 'data\processed_data\AMZN\4_2023-02-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-17' --> 'data\processed_data\AMZN\4_2023-02-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-23' --> 'data\processed_data\AMZN\4_2023-02-23.md'


2025-11-14 15:37:15,465 - INFO - Going to convert document batch...
2025-11-14 15:37:15,466 - INFO - Processing document 4_2023-02-24
2025-11-14 15:37:15,486 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 15:37:15,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,525 - INFO - Going to convert document batch...
2025-11-14 15:37:15,526 - INFO - Processing document 4_2023-03-03
2025-11-14 15:37:15,546 - INFO - Finished converting document 4_2023-03-03 in 0.05 sec.
2025-11-14 15:37:15,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,585 - INFO - Going to convert document batch...
2025-11-14 15:37:15,586 - INFO - Processing document 4_2023-03-23
2025-11-14 15:37:15,607 - INFO - Finished converting document 4_2023-03-23 in 0.05 sec.
2025-11-14 15:37:15,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,654 - INFO - Going to convert document batch...
2025-11-14 15:37:15,655 - 

Converted 'data\edgar_documents\AMZN\4_2023-02-24' --> 'data\processed_data\AMZN\4_2023-02-24.md'
Converted 'data\edgar_documents\AMZN\4_2023-03-03' --> 'data\processed_data\AMZN\4_2023-03-03.md'
Converted 'data\edgar_documents\AMZN\4_2023-03-23' --> 'data\processed_data\AMZN\4_2023-03-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-04-05' --> 'data\processed_data\AMZN\4_2023-04-05.md'


2025-11-14 15:37:15,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,726 - INFO - Going to convert document batch...
2025-11-14 15:37:15,727 - INFO - Processing document 4_2023-04-06
2025-11-14 15:37:15,753 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 15:37:15,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,806 - INFO - Going to convert document batch...
2025-11-14 15:37:15,807 - INFO - Processing document 4_2023-04-21
2025-11-14 15:37:15,835 - INFO - Finished converting document 4_2023-04-21 in 0.05 sec.
2025-11-14 15:37:15,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,888 - INFO - Going to convert document batch...
2025-11-14 15:37:15,889 - INFO - Processing document 4_2023-05-03
2025-11-14 15:37:15,909 - INFO - Finished converting document 4_2023-05-03 in 0.03 sec.
2025-11-14 15:37:15,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2023-04-06' --> 'data\processed_data\AMZN\4_2023-04-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-04-21' --> 'data\processed_data\AMZN\4_2023-04-21.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-03' --> 'data\processed_data\AMZN\4_2023-05-03.md'


2025-11-14 15:37:15,983 - INFO - Finished converting document 4_2023-05-08 in 0.05 sec.
2025-11-14 15:37:16,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,037 - INFO - Going to convert document batch...
2025-11-14 15:37:16,037 - INFO - Processing document 4_2023-05-17
2025-11-14 15:37:16,069 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 15:37:16,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,148 - INFO - Going to convert document batch...
2025-11-14 15:37:16,149 - INFO - Processing document 4_2023-05-18
2025-11-14 15:37:16,172 - INFO - Finished converting document 4_2023-05-18 in 0.06 sec.
2025-11-14 15:37:16,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-08' --> 'data\processed_data\AMZN\4_2023-05-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-17' --> 'data\processed_data\AMZN\4_2023-05-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-18' --> 'data\processed_data\AMZN\4_2023-05-18.md'


2025-11-14 15:37:16,222 - INFO - Going to convert document batch...
2025-11-14 15:37:16,223 - INFO - Processing document 4_2023-05-23
2025-11-14 15:37:16,258 - INFO - Finished converting document 4_2023-05-23 in 0.05 sec.
2025-11-14 15:37:16,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-23' --> 'data\processed_data\AMZN\4_2023-05-23.md'


2025-11-14 15:37:16,652 - INFO - Going to convert document batch...
2025-11-14 15:37:16,653 - INFO - Processing document 4_2023-05-26
2025-11-14 15:37:16,673 - INFO - Finished converting document 4_2023-05-26 in 0.38 sec.
2025-11-14 15:37:16,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,720 - INFO - Going to convert document batch...
2025-11-14 15:37:16,721 - INFO - Processing document 4_2023-06-05
2025-11-14 15:37:16,740 - INFO - Finished converting document 4_2023-06-05 in 0.03 sec.
2025-11-14 15:37:16,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,806 - INFO - Going to convert document batch...
2025-11-14 15:37:16,807 - INFO - Processing document 4_2023-06-08
2025-11-14 15:37:16,837 - INFO - Finished converting document 4_2023-06-08 in 0.06 sec.
2025-11-14 15:37:16,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-26' --> 'data\processed_data\AMZN\4_2023-05-26.md'
Converted 'data\edgar_documents\AMZN\4_2023-06-05' --> 'data\processed_data\AMZN\4_2023-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2023-06-08' --> 'data\processed_data\AMZN\4_2023-06-08.md'


2025-11-14 15:37:16,909 - INFO - Going to convert document batch...
2025-11-14 15:37:16,911 - INFO - Processing document 4_2023-06-23
2025-11-14 15:37:16,944 - INFO - Finished converting document 4_2023-06-23 in 0.08 sec.
2025-11-14 15:37:16,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,994 - INFO - Going to convert document batch...
2025-11-14 15:37:16,994 - INFO - Processing document 4_2023-07-06
2025-11-14 15:37:17,013 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 15:37:17,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,057 - INFO - Going to convert document batch...
2025-11-14 15:37:17,058 - INFO - Processing document 4_2023-07-10
2025-11-14 15:37:17,084 - INFO - Finished converting document 4_2023-07-10 in 0.05 sec.
2025-11-14 15:37:17,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,158 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2023-06-23' --> 'data\processed_data\AMZN\4_2023-06-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-07-06' --> 'data\processed_data\AMZN\4_2023-07-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-07-10' --> 'data\processed_data\AMZN\4_2023-07-10.md'


2025-11-14 15:37:17,161 - INFO - Processing document 4_2023-07-26
2025-11-14 15:37:17,182 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 15:37:17,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,223 - INFO - Going to convert document batch...
2025-11-14 15:37:17,224 - INFO - Processing document 4_2023-08-03
2025-11-14 15:37:17,242 - INFO - Finished converting document 4_2023-08-03 in 0.03 sec.
2025-11-14 15:37:17,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,303 - INFO - Going to convert document batch...
2025-11-14 15:37:17,305 - INFO - Processing document 4_2023-08-08
2025-11-14 15:37:17,353 - INFO - Finished converting document 4_2023-08-08 in 0.08 sec.
2025-11-14 15:37:17,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-07-26' --> 'data\processed_data\AMZN\4_2023-07-26.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-03' --> 'data\processed_data\AMZN\4_2023-08-03.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-08' --> 'data\processed_data\AMZN\4_2023-08-08.md'


2025-11-14 15:37:17,393 - INFO - Going to convert document batch...
2025-11-14 15:37:17,393 - INFO - Processing document 4_2023-08-11
2025-11-14 15:37:17,411 - INFO - Finished converting document 4_2023-08-11 in 0.03 sec.
2025-11-14 15:37:17,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,457 - INFO - Going to convert document batch...
2025-11-14 15:37:17,457 - INFO - Processing document 4_2023-08-17
2025-11-14 15:37:17,486 - INFO - Finished converting document 4_2023-08-17 in 0.05 sec.
2025-11-14 15:37:17,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,537 - INFO - Going to convert document batch...
2025-11-14 15:37:17,539 - INFO - Processing document 4_2023-08-23
2025-11-14 15:37:17,572 - INFO - Finished converting document 4_2023-08-23 in 0.05 sec.
2025-11-14 15:37:17,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,623 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2023-08-11' --> 'data\processed_data\AMZN\4_2023-08-11.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-17' --> 'data\processed_data\AMZN\4_2023-08-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-23' --> 'data\processed_data\AMZN\4_2023-08-23.md'


2025-11-14 15:37:17,624 - INFO - Processing document 4_2023-09-06
2025-11-14 15:37:17,645 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 15:37:17,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,688 - INFO - Going to convert document batch...
2025-11-14 15:37:17,689 - INFO - Processing document 4_2023-09-07
2025-11-14 15:37:17,710 - INFO - Finished converting document 4_2023-09-07 in 0.05 sec.
2025-11-14 15:37:17,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,752 - INFO - Going to convert document batch...
2025-11-14 15:37:17,753 - INFO - Processing document 4_2023-09-13
2025-11-14 15:37:17,773 - INFO - Finished converting document 4_2023-09-13 in 0.03 sec.
2025-11-14 15:37:17,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,829 - INFO - Going to convert document batch...
2025-11-14 15:37:17,829 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\AMZN\4_2023-09-06' --> 'data\processed_data\AMZN\4_2023-09-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-07' --> 'data\processed_data\AMZN\4_2023-09-07.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-13' --> 'data\processed_data\AMZN\4_2023-09-13.md'


2025-11-14 15:37:17,847 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 15:37:17,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,888 - INFO - Going to convert document batch...
2025-11-14 15:37:17,889 - INFO - Processing document 4_2023-09-22
2025-11-14 15:37:17,911 - INFO - Finished converting document 4_2023-09-22 in 0.05 sec.
2025-11-14 15:37:17,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,952 - INFO - Going to convert document batch...
2025-11-14 15:37:17,952 - INFO - Processing document 4_2023-10-04
2025-11-14 15:37:17,971 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.
2025-11-14 15:37:18,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,013 - INFO - Going to convert document batch...
2025-11-14 15:37:18,014 - INFO - Processing document 4_2023-10-10
2025-11-14 15:37:18,035 - INFO - Finished converting document 4_2023-10-10 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2023-09-18' --> 'data\processed_data\AMZN\4_2023-09-18.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-22' --> 'data\processed_data\AMZN\4_2023-09-22.md'
Converted 'data\edgar_documents\AMZN\4_2023-10-04' --> 'data\processed_data\AMZN\4_2023-10-04.md'


2025-11-14 15:37:18,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,081 - INFO - Going to convert document batch...
2025-11-14 15:37:18,082 - INFO - Processing document 4_2023-10-23
2025-11-14 15:37:18,102 - INFO - Finished converting document 4_2023-10-23 in 0.03 sec.
2025-11-14 15:37:18,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,164 - INFO - Going to convert document batch...
2025-11-14 15:37:18,164 - INFO - Processing document 4_2023-11-01
2025-11-14 15:37:18,185 - INFO - Finished converting document 4_2023-11-01 in 0.06 sec.
2025-11-14 15:37:18,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,225 - INFO - Going to convert document batch...
2025-11-14 15:37:18,225 - INFO - Processing document 4_2023-11-03
2025-11-14 15:37:18,242 - INFO - Finished converting document 4_2023-11-03 in 0.03 sec.
2025-11-14 15:37:18,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-10-10' --> 'data\processed_data\AMZN\4_2023-10-10.md'
Converted 'data\edgar_documents\AMZN\4_2023-10-23' --> 'data\processed_data\AMZN\4_2023-10-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-01' --> 'data\processed_data\AMZN\4_2023-11-01.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-03' --> 'data\processed_data\AMZN\4_2023-11-03.md'


2025-11-14 15:37:18,282 - INFO - Going to convert document batch...
2025-11-14 15:37:18,282 - INFO - Processing document 4_2023-11-06
2025-11-14 15:37:18,303 - INFO - Finished converting document 4_2023-11-06 in 0.03 sec.
2025-11-14 15:37:18,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,343 - INFO - Going to convert document batch...
2025-11-14 15:37:18,344 - INFO - Processing document 4_2023-11-15
2025-11-14 15:37:18,363 - INFO - Finished converting document 4_2023-11-15 in 0.03 sec.
2025-11-14 15:37:18,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,414 - INFO - Going to convert document batch...
2025-11-14 15:37:18,415 - INFO - Processing document 4_2023-11-17
2025-11-14 15:37:18,444 - INFO - Finished converting document 4_2023-11-17 in 0.06 sec.
2025-11-14 15:37:18,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,501 - INFO - Going to convert document batch...
2025-11-14 15:37:18,502 - 

Converted 'data\edgar_documents\AMZN\4_2023-11-06' --> 'data\processed_data\AMZN\4_2023-11-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-15' --> 'data\processed_data\AMZN\4_2023-11-15.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-17' --> 'data\processed_data\AMZN\4_2023-11-17.md'


2025-11-14 15:37:18,536 - INFO - Finished converting document 4_2023-11-24 in 0.06 sec.
2025-11-14 15:37:18,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,586 - INFO - Going to convert document batch...
2025-11-14 15:37:18,587 - INFO - Processing document 4_2023-11-27
2025-11-14 15:37:18,607 - INFO - Finished converting document 4_2023-11-27 in 0.05 sec.
2025-11-14 15:37:18,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,644 - INFO - Going to convert document batch...
2025-11-14 15:37:18,645 - INFO - Processing document 4_2023-12-05
2025-11-14 15:37:18,664 - INFO - Finished converting document 4_2023-12-05 in 0.03 sec.
2025-11-14 15:37:18,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,721 - INFO - Going to convert document batch...
2025-11-14 15:37:18,721 - INFO - Processing document 4_2023-12-08
2025-11-14 15:37:18,740 - INFO - Finished converting document 4_2023-12-08 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2023-11-24' --> 'data\processed_data\AMZN\4_2023-11-24.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-27' --> 'data\processed_data\AMZN\4_2023-11-27.md'
Converted 'data\edgar_documents\AMZN\4_2023-12-05' --> 'data\processed_data\AMZN\4_2023-12-05.md'


2025-11-14 15:37:18,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,786 - INFO - Going to convert document batch...
2025-11-14 15:37:18,787 - INFO - Processing document 4_2023-12-26
2025-11-14 15:37:18,815 - INFO - Finished converting document 4_2023-12-26 in 0.05 sec.
2025-11-14 15:37:18,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,891 - INFO - Going to convert document batch...
2025-11-14 15:37:18,893 - INFO - Processing document 4_2024-01-08
2025-11-14 15:37:18,926 - INFO - Finished converting document 4_2024-01-08 in 0.08 sec.


Converted 'data\edgar_documents\AMZN\4_2023-12-08' --> 'data\processed_data\AMZN\4_2023-12-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-12-26' --> 'data\processed_data\AMZN\4_2023-12-26.md'


2025-11-14 15:37:18,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,974 - INFO - Going to convert document batch...
2025-11-14 15:37:18,975 - INFO - Processing document 4_2024-01-22
2025-11-14 15:37:19,003 - INFO - Finished converting document 4_2024-01-22 in 0.05 sec.
2025-11-14 15:37:19,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,050 - INFO - Going to convert document batch...
2025-11-14 15:37:19,051 - INFO - Processing document 4_2024-02-05
2025-11-14 15:37:19,072 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 15:37:19,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,113 - INFO - Going to convert document batch...
2025-11-14 15:37:19,114 - INFO - Processing document 4_2024-02-09
2025-11-14 15:37:19,135 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-01-08' --> 'data\processed_data\AMZN\4_2024-01-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-01-22' --> 'data\processed_data\AMZN\4_2024-01-22.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-05' --> 'data\processed_data\AMZN\4_2024-02-05.md'


2025-11-14 15:37:19,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,178 - INFO - Going to convert document batch...
2025-11-14 15:37:19,179 - INFO - Processing document 4_2024-02-13
2025-11-14 15:37:19,197 - INFO - Finished converting document 4_2024-02-13 in 0.03 sec.
2025-11-14 15:37:19,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,235 - INFO - Going to convert document batch...
2025-11-14 15:37:19,236 - INFO - Processing document 4_2024-02-14
2025-11-14 15:37:19,253 - INFO - Finished converting document 4_2024-02-14 in 0.03 sec.
2025-11-14 15:37:19,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,298 - INFO - Going to convert document batch...
2025-11-14 15:37:19,299 - INFO - Processing document 4_2024-02-15
2025-11-14 15:37:19,328 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2024-02-09' --> 'data\processed_data\AMZN\4_2024-02-09.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-13' --> 'data\processed_data\AMZN\4_2024-02-13.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-14' --> 'data\processed_data\AMZN\4_2024-02-14.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-15' --> 'data\processed_data\AMZN\4_2024-02-15.md'


2025-11-14 15:37:19,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,394 - INFO - Going to convert document batch...
2025-11-14 15:37:19,395 - INFO - Processing document 4_2024-02-20
2025-11-14 15:37:19,416 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 15:37:19,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,460 - INFO - Going to convert document batch...
2025-11-14 15:37:19,461 - INFO - Processing document 4_2024-02-23
2025-11-14 15:37:19,492 - INFO - Finished converting document 4_2024-02-23 in 0.05 sec.
2025-11-14 15:37:19,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,540 - INFO - Going to convert document batch...
2025-11-14 15:37:19,541 - INFO - Processing document 4_2024-03-04
2025-11-14 15:37:19,560 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.
2025-11-14 15:37:19,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2024-02-20' --> 'data\processed_data\AMZN\4_2024-02-20.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-23' --> 'data\processed_data\AMZN\4_2024-02-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-04' --> 'data\processed_data\AMZN\4_2024-03-04.md'


2025-11-14 15:37:19,621 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:37:19,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,660 - INFO - Going to convert document batch...
2025-11-14 15:37:19,661 - INFO - Processing document 4_2024-03-06
2025-11-14 15:37:19,679 - INFO - Finished converting document 4_2024-03-06 in 0.03 sec.
2025-11-14 15:37:19,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,717 - INFO - Going to convert document batch...
2025-11-14 15:37:19,718 - INFO - Processing document 4_2024-03-11
2025-11-14 15:37:19,738 - INFO - Finished converting document 4_2024-03-11 in 0.03 sec.
2025-11-14 15:37:19,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,782 - INFO - Going to convert document batch...
2025-11-14 15:37:19,783 - INFO - Processing document 4_2024-03-25
2025-11-14 15:37:19,803 - INFO - Finished converting document 4_2024-03-25 in 0.05 sec.
2025-1

Converted 'data\edgar_documents\AMZN\4_2024-03-05' --> 'data\processed_data\AMZN\4_2024-03-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-06' --> 'data\processed_data\AMZN\4_2024-03-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-11' --> 'data\processed_data\AMZN\4_2024-03-11.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-25' --> 'data\processed_data\AMZN\4_2024-03-25.md'


2025-11-14 15:37:19,845 - INFO - Going to convert document batch...
2025-11-14 15:37:19,846 - INFO - Processing document 4_2024-04-03
2025-11-14 15:37:19,887 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:37:19,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,939 - INFO - Going to convert document batch...
2025-11-14 15:37:19,940 - INFO - Processing document 4_2024-04-08
2025-11-14 15:37:19,962 - INFO - Finished converting document 4_2024-04-08 in 0.03 sec.
2025-11-14 15:37:20,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,020 - INFO - Going to convert document batch...
2025-11-14 15:37:20,021 - INFO - Processing document 4_2024-04-12
2025-11-14 15:37:20,040 - INFO - Finished converting document 4_2024-04-12 in 0.05 sec.
2025-11-14 15:37:20,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,082 - INFO - Going to convert document batch...
2025-11-14 15:37:20,083 - 

Converted 'data\edgar_documents\AMZN\4_2024-04-03' --> 'data\processed_data\AMZN\4_2024-04-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-04-08' --> 'data\processed_data\AMZN\4_2024-04-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-04-12' --> 'data\processed_data\AMZN\4_2024-04-12.md'


2025-11-14 15:37:20,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,150 - INFO - Going to convert document batch...
2025-11-14 15:37:20,151 - INFO - Processing document 4_2024-05-03
2025-11-14 15:37:20,188 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.
2025-11-14 15:37:20,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,252 - INFO - Going to convert document batch...
2025-11-14 15:37:20,253 - INFO - Processing document 4_2024-05-08
2025-11-14 15:37:20,269 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.
2025-11-14 15:37:20,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,309 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-04-22' --> 'data\processed_data\AMZN\4_2024-04-22.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-03' --> 'data\processed_data\AMZN\4_2024-05-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-08' --> 'data\processed_data\AMZN\4_2024-05-08.md'


2025-11-14 15:37:20,310 - INFO - Processing document 4_2024-05-13
2025-11-14 15:37:20,327 - INFO - Finished converting document 4_2024-05-13 in 0.03 sec.
2025-11-14 15:37:20,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2024-05-13' --> 'data\processed_data\AMZN\4_2024-05-13.md'


2025-11-14 15:37:20,611 - INFO - Going to convert document batch...
2025-11-14 15:37:20,612 - INFO - Processing document 4_2024-05-17
2025-11-14 15:37:20,645 - INFO - Finished converting document 4_2024-05-17 in 0.30 sec.
2025-11-14 15:37:20,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,698 - INFO - Going to convert document batch...
2025-11-14 15:37:20,699 - INFO - Processing document 4_2024-05-23
2025-11-14 15:37:20,727 - INFO - Finished converting document 4_2024-05-23 in 0.05 sec.
2025-11-14 15:37:20,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,778 - INFO - Going to convert document batch...
2025-11-14 15:37:20,779 - INFO - Processing document 4_2024-05-31
2025-11-14 15:37:20,797 - INFO - Finished converting document 4_2024-05-31 in 0.05 sec.
2025-11-14 15:37:20,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,837 - INFO - Going to convert document batch...
2025-11-14 15:37:20,838 - 

Converted 'data\edgar_documents\AMZN\4_2024-05-17' --> 'data\processed_data\AMZN\4_2024-05-17.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-23' --> 'data\processed_data\AMZN\4_2024-05-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-31' --> 'data\processed_data\AMZN\4_2024-05-31.md'


2025-11-14 15:37:20,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,897 - INFO - Going to convert document batch...
2025-11-14 15:37:20,899 - INFO - Processing document 4_2024-07-01
2025-11-14 15:37:20,922 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 15:37:20,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,987 - INFO - Going to convert document batch...
2025-11-14 15:37:20,988 - INFO - Processing document 4_2024-07-03
2025-11-14 15:37:21,012 - INFO - Finished converting document 4_2024-07-03 in 0.06 sec.
2025-11-14 15:37:21,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,057 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-06-05' --> 'data\processed_data\AMZN\4_2024-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-01' --> 'data\processed_data\AMZN\4_2024-07-01.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-03' --> 'data\processed_data\AMZN\4_2024-07-03.md'


2025-11-14 15:37:21,058 - INFO - Processing document 4_2024-07-05
2025-11-14 15:37:21,078 - INFO - Finished converting document 4_2024-07-05 in 0.05 sec.
2025-11-14 15:37:21,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,121 - INFO - Going to convert document batch...
2025-11-14 15:37:21,122 - INFO - Processing document 4_2024-07-09
2025-11-14 15:37:21,143 - INFO - Finished converting document 4_2024-07-09 in 0.05 sec.
2025-11-14 15:37:21,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,212 - INFO - Going to convert document batch...
2025-11-14 15:37:21,213 - INFO - Processing document 4_2024-07-11
2025-11-14 15:37:21,241 - INFO - Finished converting document 4_2024-07-11 in 0.08 sec.
2025-11-14 15:37:21,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,281 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-07-05' --> 'data\processed_data\AMZN\4_2024-07-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-09' --> 'data\processed_data\AMZN\4_2024-07-09.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-11' --> 'data\processed_data\AMZN\4_2024-07-11.md'


2025-11-14 15:37:21,282 - INFO - Processing document 4_2024-07-15
2025-11-14 15:37:21,306 - INFO - Finished converting document 4_2024-07-15 in 0.03 sec.
2025-11-14 15:37:21,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,349 - INFO - Going to convert document batch...
2025-11-14 15:37:21,350 - INFO - Processing document 4_2024-08-05
2025-11-14 15:37:21,368 - INFO - Finished converting document 4_2024-08-05 in 0.03 sec.
2025-11-14 15:37:21,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,429 - INFO - Going to convert document batch...
2025-11-14 15:37:21,429 - INFO - Processing document 4_2024-08-19
2025-11-14 15:37:21,453 - INFO - Finished converting document 4_2024-08-19 in 0.06 sec.
2025-11-14 15:37:21,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,502 - INFO - Going to convert document batch...
2025-11-14 15:37:21,503 - INFO - Processing document 4_2024-08-23
2025-11-14 15:37:21,534 - IN

Converted 'data\edgar_documents\AMZN\4_2024-07-15' --> 'data\processed_data\AMZN\4_2024-07-15.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-05' --> 'data\processed_data\AMZN\4_2024-08-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-19' --> 'data\processed_data\AMZN\4_2024-08-19.md'


2025-11-14 15:37:21,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,606 - INFO - Going to convert document batch...
2025-11-14 15:37:21,607 - INFO - Processing document 4_2024-08-30
2025-11-14 15:37:21,626 - INFO - Finished converting document 4_2024-08-30 in 0.06 sec.
2025-11-14 15:37:21,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,666 - INFO - Going to convert document batch...
2025-11-14 15:37:21,667 - INFO - Processing document 4_2024-09-05
2025-11-14 15:37:21,685 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 15:37:21,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,729 - INFO - Going to convert document batch...
2025-11-14 15:37:21,730 - INFO - Processing document 4_2024-09-11
2025-11-14 15:37:21,748 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-08-23' --> 'data\processed_data\AMZN\4_2024-08-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-30' --> 'data\processed_data\AMZN\4_2024-08-30.md'
Converted 'data\edgar_documents\AMZN\4_2024-09-05' --> 'data\processed_data\AMZN\4_2024-09-05.md'


2025-11-14 15:37:21,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,789 - INFO - Going to convert document batch...
2025-11-14 15:37:21,790 - INFO - Processing document 4_2024-09-26
2025-11-14 15:37:21,808 - INFO - Finished converting document 4_2024-09-26 in 0.05 sec.
2025-11-14 15:37:21,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,847 - INFO - Going to convert document batch...
2025-11-14 15:37:21,848 - INFO - Processing document 4_2024-10-03
2025-11-14 15:37:21,864 - INFO - Finished converting document 4_2024-10-03 in 0.03 sec.
2025-11-14 15:37:21,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,902 - INFO - Going to convert document batch...
2025-11-14 15:37:21,903 - INFO - Processing document 4_2024-11-05
2025-11-14 15:37:21,919 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 15:37:21,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2024-09-11' --> 'data\processed_data\AMZN\4_2024-09-11.md'
Converted 'data\edgar_documents\AMZN\4_2024-09-26' --> 'data\processed_data\AMZN\4_2024-09-26.md'
Converted 'data\edgar_documents\AMZN\4_2024-10-03' --> 'data\processed_data\AMZN\4_2024-10-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-05' --> 'data\processed_data\AMZN\4_2024-11-05.md'


2025-11-14 15:37:21,962 - INFO - Going to convert document batch...
2025-11-14 15:37:21,963 - INFO - Processing document 4_2024-11-06
2025-11-14 15:37:21,979 - INFO - Finished converting document 4_2024-11-06 in 0.05 sec.
2025-11-14 15:37:22,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,022 - INFO - Going to convert document batch...
2025-11-14 15:37:22,023 - INFO - Processing document 4_2024-11-08
2025-11-14 15:37:22,054 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 15:37:22,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,101 - INFO - Going to convert document batch...
2025-11-14 15:37:22,102 - INFO - Processing document 4_2024-11-12
2025-11-14 15:37:22,120 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 15:37:22,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,165 - INFO - Going to convert document batch...
2025-11-14 15:37:22,166 - 

Converted 'data\edgar_documents\AMZN\4_2024-11-06' --> 'data\processed_data\AMZN\4_2024-11-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-08' --> 'data\processed_data\AMZN\4_2024-11-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-12' --> 'data\processed_data\AMZN\4_2024-11-12.md'


2025-11-14 15:37:22,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,245 - INFO - Going to convert document batch...
2025-11-14 15:37:22,246 - INFO - Processing document 4_2024-11-19
2025-11-14 15:37:22,270 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 15:37:22,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,312 - INFO - Going to convert document batch...
2025-11-14 15:37:22,313 - INFO - Processing document 4_2024-11-20
2025-11-14 15:37:22,334 - INFO - Finished converting document 4_2024-11-20 in 0.03 sec.
2025-11-14 15:37:22,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,391 - INFO - Going to convert document batch...
2025-11-14 15:37:22,392 - INFO - Processing document 4_2024-11-21
2025-11-14 15:37:22,413 - INFO - Finished converting document 4_2024-11-21 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-11-14' --> 'data\processed_data\AMZN\4_2024-11-14.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-19' --> 'data\processed_data\AMZN\4_2024-11-19.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-20' --> 'data\processed_data\AMZN\4_2024-11-20.md'


2025-11-14 15:37:22,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,467 - INFO - Going to convert document batch...
2025-11-14 15:37:22,468 - INFO - Processing document 4_2024-11-25
2025-11-14 15:37:22,527 - INFO - Finished converting document 4_2024-11-25 in 0.09 sec.
2025-11-14 15:37:22,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,600 - INFO - Going to convert document batch...
2025-11-14 15:37:22,600 - INFO - Processing document 4_2024-12-04
2025-11-14 15:37:22,618 - INFO - Finished converting document 4_2024-12-04 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-11-21' --> 'data\processed_data\AMZN\4_2024-11-21.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-25' --> 'data\processed_data\AMZN\4_2024-11-25.md'


2025-11-14 15:37:22,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,659 - INFO - Going to convert document batch...
2025-11-14 15:37:22,660 - INFO - Processing document 4_2024-12-06
2025-11-14 15:37:22,679 - INFO - Finished converting document 4_2024-12-06 in 0.03 sec.
2025-11-14 15:37:22,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,718 - INFO - Going to convert document batch...
2025-11-14 15:37:22,719 - INFO - Processing document 4_2024-12-11
2025-11-14 15:37:22,737 - INFO - Finished converting document 4_2024-12-11 in 0.03 sec.
2025-11-14 15:37:22,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,780 - INFO - Going to convert document batch...
2025-11-14 15:37:22,782 - INFO - Processing document 4_2025-02-14
2025-11-14 15:37:22,805 - INFO - Finished converting document 4_2025-02-14 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-12-04' --> 'data\processed_data\AMZN\4_2024-12-04.md'
Converted 'data\edgar_documents\AMZN\4_2024-12-06' --> 'data\processed_data\AMZN\4_2024-12-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-12-11' --> 'data\processed_data\AMZN\4_2024-12-11.md'
Converted 'data\edgar_documents\AMZN\4_2025-02-14' --> 'data\processed_data\AMZN\4_2025-02-14.md'


2025-11-14 15:37:22,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,872 - INFO - Going to convert document batch...
2025-11-14 15:37:22,873 - INFO - Processing document 4_2025-02-19
2025-11-14 15:37:22,903 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 15:37:22,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,952 - INFO - Going to convert document batch...
2025-11-14 15:37:22,953 - INFO - Processing document 4_2025-02-25
2025-11-14 15:37:22,983 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 15:37:23,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,030 - INFO - Going to convert document batch...
2025-11-14 15:37:23,031 - INFO - Processing document 4_2025-03-05
2025-11-14 15:37:23,048 - INFO - Finished converting document 4_2025-03-05 in 0.03 sec.
2025-11-14 15:37:23,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2025-02-19' --> 'data\processed_data\AMZN\4_2025-02-19.md'
Converted 'data\edgar_documents\AMZN\4_2025-02-25' --> 'data\processed_data\AMZN\4_2025-02-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-03-05' --> 'data\processed_data\AMZN\4_2025-03-05.md'


2025-11-14 15:37:23,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,148 - INFO - Going to convert document batch...
2025-11-14 15:37:23,149 - INFO - Processing document 4_2025-04-03
2025-11-14 15:37:23,173 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 15:37:23,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,215 - INFO - Going to convert document batch...
2025-11-14 15:37:23,215 - INFO - Processing document 4_2025-04-14
2025-11-14 15:37:23,242 - INFO - Finished converting document 4_2025-04-14 in 0.05 sec.
2025-11-14 15:37:23,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,305 - INFO - Going to convert document batch...
2025-11-14 15:37:23,306 - INFO - Processing document 4_2025-05-05
2025-11-14 15:37:23,328 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2025-03-12' --> 'data\processed_data\AMZN\4_2025-03-12.md'
Converted 'data\edgar_documents\AMZN\4_2025-04-03' --> 'data\processed_data\AMZN\4_2025-04-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-04-14' --> 'data\processed_data\AMZN\4_2025-04-14.md'


2025-11-14 15:37:23,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,366 - INFO - Going to convert document batch...
2025-11-14 15:37:23,367 - INFO - Processing document 4_2025-05-14
2025-11-14 15:37:23,384 - INFO - Finished converting document 4_2025-05-14 in 0.03 sec.
2025-11-14 15:37:23,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,456 - INFO - Going to convert document batch...
2025-11-14 15:37:23,458 - INFO - Processing document 4_2025-05-15
2025-11-14 15:37:23,480 - INFO - Finished converting document 4_2025-05-15 in 0.06 sec.
2025-11-14 15:37:23,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,525 - INFO - Going to convert document batch...
2025-11-14 15:37:23,526 - INFO - Processing document 4_2025-05-19


Converted 'data\edgar_documents\AMZN\4_2025-05-05' --> 'data\processed_data\AMZN\4_2025-05-05.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-14' --> 'data\processed_data\AMZN\4_2025-05-14.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-15' --> 'data\processed_data\AMZN\4_2025-05-15.md'


2025-11-14 15:37:23,551 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 15:37:23,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,595 - INFO - Going to convert document batch...
2025-11-14 15:37:23,596 - INFO - Processing document 4_2025-05-22
2025-11-14 15:37:23,615 - INFO - Finished converting document 4_2025-05-22 in 0.03 sec.
2025-11-14 15:37:23,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,694 - INFO - Going to convert document batch...
2025-11-14 15:37:23,695 - INFO - Processing document 4_2025-05-23
2025-11-14 15:37:23,722 - INFO - Finished converting document 4_2025-05-23 in 0.08 sec.
2025-11-14 15:37:23,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2025-05-19' --> 'data\processed_data\AMZN\4_2025-05-19.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-22' --> 'data\processed_data\AMZN\4_2025-05-22.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-23' --> 'data\processed_data\AMZN\4_2025-05-23.md'


2025-11-14 15:37:23,769 - INFO - Going to convert document batch...
2025-11-14 15:37:23,770 - INFO - Processing document 4_2025-06-04
2025-11-14 15:37:23,791 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 15:37:23,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,829 - INFO - Going to convert document batch...
2025-11-14 15:37:23,830 - INFO - Processing document 4_2025-06-05
2025-11-14 15:37:23,846 - INFO - Finished converting document 4_2025-06-05 in 0.03 sec.
2025-11-14 15:37:23,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,909 - INFO - Going to convert document batch...
2025-11-14 15:37:23,910 - INFO - Processing document 4_2025-07-01
2025-11-14 15:37:23,931 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.
2025-11-14 15:37:23,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,979 - INFO - Going to convert document batch...
2025-11-14 15:37:23,980 - 

Converted 'data\edgar_documents\AMZN\4_2025-06-04' --> 'data\processed_data\AMZN\4_2025-06-04.md'
Converted 'data\edgar_documents\AMZN\4_2025-06-05' --> 'data\processed_data\AMZN\4_2025-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-01' --> 'data\processed_data\AMZN\4_2025-07-01.md'


2025-11-14 15:37:24,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,045 - INFO - Going to convert document batch...
2025-11-14 15:37:24,046 - INFO - Processing document 4_2025-07-08
2025-11-14 15:37:24,064 - INFO - Finished converting document 4_2025-07-08 in 0.05 sec.
2025-11-14 15:37:24,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,110 - INFO - Going to convert document batch...
2025-11-14 15:37:24,111 - INFO - Processing document 4_2025-07-10
2025-11-14 15:37:24,129 - INFO - Finished converting document 4_2025-07-10 in 0.03 sec.
2025-11-14 15:37:24,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,202 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2025-07-03' --> 'data\processed_data\AMZN\4_2025-07-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-08' --> 'data\processed_data\AMZN\4_2025-07-08.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-10' --> 'data\processed_data\AMZN\4_2025-07-10.md'


2025-11-14 15:37:24,202 - INFO - Processing document 4_2025-07-15
2025-11-14 15:37:24,226 - INFO - Finished converting document 4_2025-07-15 in 0.08 sec.
2025-11-14 15:37:24,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,267 - INFO - Going to convert document batch...
2025-11-14 15:37:24,268 - INFO - Processing document 4_2025-07-17
2025-11-14 15:37:24,286 - INFO - Finished converting document 4_2025-07-17 in 0.03 sec.
2025-11-14 15:37:24,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2025-07-15' --> 'data\processed_data\AMZN\4_2025-07-15.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-17' --> 'data\processed_data\AMZN\4_2025-07-17.md'


2025-11-14 15:37:24,541 - INFO - Going to convert document batch...
2025-11-14 15:37:24,543 - INFO - Processing document 4_2025-07-23
2025-11-14 15:37:24,568 - INFO - Finished converting document 4_2025-07-23 in 0.27 sec.
2025-11-14 15:37:24,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,616 - INFO - Going to convert document batch...
2025-11-14 15:37:24,617 - INFO - Processing document 4_2025-07-25
2025-11-14 15:37:24,645 - INFO - Finished converting document 4_2025-07-25 in 0.05 sec.
2025-11-14 15:37:24,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,688 - INFO - Going to convert document batch...
2025-11-14 15:37:24,689 - INFO - Processing document 4_2025-08-05
2025-11-14 15:37:24,708 - INFO - Finished converting document 4_2025-08-05 in 0.03 sec.
2025-11-14 15:37:24,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,744 - INFO - Going to convert document batch...
2025-11-14 15:37:24,745 - 

Converted 'data\edgar_documents\AMZN\4_2025-07-23' --> 'data\processed_data\AMZN\4_2025-07-23.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-25' --> 'data\processed_data\AMZN\4_2025-07-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-05' --> 'data\processed_data\AMZN\4_2025-08-05.md'


2025-11-14 15:37:24,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,807 - INFO - Going to convert document batch...
2025-11-14 15:37:24,808 - INFO - Processing document 4_2025-08-18
2025-11-14 15:37:24,827 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 15:37:24,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,869 - INFO - Going to convert document batch...
2025-11-14 15:37:24,870 - INFO - Processing document 4_2025-08-19
2025-11-14 15:37:24,895 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 15:37:24,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,983 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2025-08-12' --> 'data\processed_data\AMZN\4_2025-08-12.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-18' --> 'data\processed_data\AMZN\4_2025-08-18.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-19' --> 'data\processed_data\AMZN\4_2025-08-19.md'


2025-11-14 15:37:24,985 - INFO - Processing document 4_2025-08-25
2025-11-14 15:37:25,022 - INFO - Finished converting document 4_2025-08-25 in 0.09 sec.
2025-11-14 15:37:25,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,067 - INFO - Going to convert document batch...
2025-11-14 15:37:25,069 - INFO - Processing document 4_2025-09-02
2025-11-14 15:37:25,088 - INFO - Finished converting document 4_2025-09-02 in 0.03 sec.
2025-11-14 15:37:25,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,148 - INFO - Going to convert document batch...
2025-11-14 15:37:25,149 - INFO - Processing document 4_2025-09-04
2025-11-14 15:37:25,169 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 15:37:25,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,209 - INFO - Going to convert document batch...
2025-11-14 15:37:25,210 - INFO - Processing document 4_2025-09-10
2025-11-14 15:37:25,228 - IN

Converted 'data\edgar_documents\AMZN\4_2025-08-25' --> 'data\processed_data\AMZN\4_2025-08-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-09-02' --> 'data\processed_data\AMZN\4_2025-09-02.md'
Converted 'data\edgar_documents\AMZN\4_2025-09-04' --> 'data\processed_data\AMZN\4_2025-09-04.md'


2025-11-14 15:37:25,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,266 - INFO - Going to convert document batch...
2025-11-14 15:37:25,267 - INFO - Processing document 4_2025-10-03
2025-11-14 15:37:25,285 - INFO - Finished converting document 4_2025-10-03 in 0.03 sec.
2025-11-14 15:37:25,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,333 - INFO - Going to convert document batch...
2025-11-14 15:37:25,334 - INFO - Processing document 4_2025-11-04
2025-11-14 15:37:25,354 - INFO - Finished converting document 4_2025-11-04 in 0.03 sec.
2025-11-14 15:37:25,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,410 - INFO - Going to convert document batch...
2025-11-14 15:37:25,411 - INFO - Processing document 4_2025-11-10
2025-11-14 15:37:25,432 - INFO - Finished converting document 4_2025-11-10 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2025-09-10' --> 'data\processed_data\AMZN\4_2025-09-10.md'
Converted 'data\edgar_documents\AMZN\4_2025-10-03' --> 'data\processed_data\AMZN\4_2025-10-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-11-04' --> 'data\processed_data\AMZN\4_2025-11-04.md'


2025-11-14 15:37:25,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,477 - INFO - Going to convert document batch...
2025-11-14 15:37:25,477 - INFO - Processing document 8-K_2023-01-03
2025-11-14 15:37:25,500 - INFO - Finished converting document 8-K_2023-01-03 in 0.05 sec.
2025-11-14 15:37:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,536 - INFO - Going to convert document batch...
2025-11-14 15:37:25,536 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:37:25,561 - INFO - Finished converting document 8-K_2023-01-06 in 0.05 sec.
2025-11-14 15:37:25,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,599 - INFO - Going to convert document batch...
2025-11-14 15:37:25,599 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:37:25,622 - INFO - Finished converting document 8-K_2023-02-02 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2025-11-10' --> 'data\processed_data\AMZN\4_2025-11-10.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-01-03' --> 'data\processed_data\AMZN\8-K_2023-01-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-01-06' --> 'data\processed_data\AMZN\8-K_2023-01-06.md'


2025-11-14 15:37:25,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,665 - INFO - Going to convert document batch...
2025-11-14 15:37:25,666 - INFO - Processing document 8-K_2023-04-13
2025-11-14 15:37:25,689 - INFO - Finished converting document 8-K_2023-04-13 in 0.05 sec.
2025-11-14 15:37:25,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,729 - INFO - Going to convert document batch...
2025-11-14 15:37:25,729 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:37:25,751 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:37:25,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,819 - INFO - Going to convert document batch...
2025-11-14 15:37:25,820 - INFO - Processing document 8-K_2023-05-26


Converted 'data\edgar_documents\AMZN\8-K_2023-02-02' --> 'data\processed_data\AMZN\8-K_2023-02-02.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-04-13' --> 'data\processed_data\AMZN\8-K_2023-04-13.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-04-27' --> 'data\processed_data\AMZN\8-K_2023-04-27.md'


2025-11-14 15:37:25,928 - INFO - Finished converting document 8-K_2023-05-26 in 0.16 sec.
2025-11-14 15:37:26,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,027 - INFO - Going to convert document batch...
2025-11-14 15:37:26,028 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:37:26,052 - INFO - Finished converting document 8-K_2023-08-03 in 0.08 sec.
2025-11-14 15:37:26,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,093 - INFO - Going to convert document batch...
2025-11-14 15:37:26,094 - INFO - Processing document 8-K_2023-09-13
2025-11-14 15:37:26,110 - INFO - Finished converting document 8-K_2023-09-13 in 0.05 sec.
2025-11-14 15:37:26,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,146 - INFO - Going to convert document batch...
2025-11-14 15:37:26,146 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:37:26,167 - INFO - Finished converting document 8-K_2023-10-26 in 0.

Converted 'data\edgar_documents\AMZN\8-K_2023-05-26' --> 'data\processed_data\AMZN\8-K_2023-05-26.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-08-03' --> 'data\processed_data\AMZN\8-K_2023-08-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-09-13' --> 'data\processed_data\AMZN\8-K_2023-09-13.md'


2025-11-14 15:37:26,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,217 - INFO - Going to convert document batch...
2025-11-14 15:37:26,217 - INFO - Processing document 8-K_2023-11-01
2025-11-14 15:37:26,251 - INFO - Finished converting document 8-K_2023-11-01 in 0.06 sec.
2025-11-14 15:37:26,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,318 - INFO - Going to convert document batch...
2025-11-14 15:37:26,319 - INFO - Processing document 8-K_2024-02-01


Converted 'data\edgar_documents\AMZN\8-K_2023-10-26' --> 'data\processed_data\AMZN\8-K_2023-10-26.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-11-01' --> 'data\processed_data\AMZN\8-K_2023-11-01.md'


2025-11-14 15:37:26,373 - INFO - Finished converting document 8-K_2024-02-01 in 0.09 sec.
2025-11-14 15:37:26,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,421 - INFO - Going to convert document batch...
2025-11-14 15:37:26,422 - INFO - Processing document 8-K_2024-04-11
2025-11-14 15:37:26,446 - INFO - Finished converting document 8-K_2024-04-11 in 0.05 sec.
2025-11-14 15:37:26,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,483 - INFO - Going to convert document batch...
2025-11-14 15:37:26,484 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:37:26,504 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.
2025-11-14 15:37:26,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,570 - INFO - Going to convert document batch...
2025-11-14 15:37:26,571 - INFO - Processing document 8-K_2024-05-03
2025-11-14 15:37:26,594 - INFO - Finished converting document 8-K_2024-05-03 in 0.

Converted 'data\edgar_documents\AMZN\8-K_2024-02-01' --> 'data\processed_data\AMZN\8-K_2024-02-01.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-04-11' --> 'data\processed_data\AMZN\8-K_2024-04-11.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-04-30' --> 'data\processed_data\AMZN\8-K_2024-04-30.md'


2025-11-14 15:37:26,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,632 - INFO - Going to convert document batch...
2025-11-14 15:37:26,633 - INFO - Processing document 8-K_2024-05-14
2025-11-14 15:37:26,654 - INFO - Finished converting document 8-K_2024-05-14 in 0.05 sec.
2025-11-14 15:37:26,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,710 - INFO - Going to convert document batch...
2025-11-14 15:37:26,712 - INFO - Processing document 8-K_2024-05-24
2025-11-14 15:37:26,767 - INFO - Finished converting document 8-K_2024-05-24 in 0.09 sec.


Converted 'data\edgar_documents\AMZN\8-K_2024-05-03' --> 'data\processed_data\AMZN\8-K_2024-05-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-05-14' --> 'data\processed_data\AMZN\8-K_2024-05-14.md'


2025-11-14 15:37:26,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,820 - INFO - Going to convert document batch...
2025-11-14 15:37:26,820 - INFO - Processing document 8-K_2024-08-01
2025-11-14 15:37:26,845 - INFO - Finished converting document 8-K_2024-08-01 in 0.05 sec.
2025-11-14 15:37:26,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,880 - INFO - Going to convert document batch...
2025-11-14 15:37:26,881 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:37:26,908 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 15:37:26,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,966 - INFO - Going to convert document batch...
2025-11-14 15:37:26,967 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:37:26,987 - INFO - Finished converting document 8-K_2025-02-06 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\8-K_2024-05-24' --> 'data\processed_data\AMZN\8-K_2024-05-24.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-08-01' --> 'data\processed_data\AMZN\8-K_2024-08-01.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-10-31' --> 'data\processed_data\AMZN\8-K_2024-10-31.md'


2025-11-14 15:37:27,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,029 - INFO - Going to convert document batch...
2025-11-14 15:37:27,030 - INFO - Processing document 8-K_2025-04-10
2025-11-14 15:37:27,055 - INFO - Finished converting document 8-K_2025-04-10 in 0.05 sec.
2025-11-14 15:37:27,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,103 - INFO - Going to convert document batch...
2025-11-14 15:37:27,105 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:37:27,135 - INFO - Finished converting document 8-K_2025-05-01 in 0.06 sec.
2025-11-14 15:37:27,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,196 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\8-K_2025-02-06' --> 'data\processed_data\AMZN\8-K_2025-02-06.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-04-10' --> 'data\processed_data\AMZN\8-K_2025-04-10.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-05-01' --> 'data\processed_data\AMZN\8-K_2025-05-01.md'


2025-11-14 15:37:27,197 - INFO - Processing document 8-K_2025-05-22
2025-11-14 15:37:27,260 - INFO - Finished converting document 8-K_2025-05-22 in 0.12 sec.
2025-11-14 15:37:27,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,314 - INFO - Going to convert document batch...
2025-11-14 15:37:27,314 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:37:27,335 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 15:37:27,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,372 - INFO - Going to convert document batch...
2025-11-14 15:37:27,373 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:37:27,395 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 15:37:27,443 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:37:27,444 - ERROR - Input document DEF-14A_2023-04-13 with format None does not match any 

Converted 'data\edgar_documents\AMZN\8-K_2025-05-22' --> 'data\processed_data\AMZN\8-K_2025-05-22.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-07-31' --> 'data\processed_data\AMZN\8-K_2025-07-31.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-10-30' --> 'data\processed_data\AMZN\8-K_2025-10-30.md'
Error processing data\edgar_documents\AMZN\DEF-14A_2023-04-13: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2023-04-13


2025-11-14 15:37:27,480 - ERROR - Input document DEF-14A_2024-04-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:37:27,481 - INFO - Going to convert document batch...
2025-11-14 15:37:27,512 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:37:27,512 - ERROR - Input document DEF-14A_2025-04-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\AMZN\DEF-14A_2024-04-11: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2024-04-11
Error processing data\edgar_documents\AMZN\DEF-14A_2025-04-10: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2025-04-10
Processed 166 new files. Errors: 3
Found 156 files to process in data\edgar_documents\AVGO


2025-11-14 15:37:28,330 - INFO - Going to convert document batch...
2025-11-14 15:37:28,330 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:37:28,331 - INFO - Processing document 10-K_2023-12-14
2025-11-14 15:37:29,611 - INFO - Finished converting document 10-K_2023-12-14 in 2.09 sec.
2025-11-14 15:37:30,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-K_2023-12-14' --> 'data\processed_data\AVGO\10-K_2023-12-14.md'


2025-11-14 15:37:31,075 - INFO - Going to convert document batch...
2025-11-14 15:37:31,076 - INFO - Processing document 10-K_2024-12-20
2025-11-14 15:37:32,508 - INFO - Finished converting document 10-K_2024-12-20 in 2.31 sec.
2025-11-14 15:37:33,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-K_2024-12-20' --> 'data\processed_data\AVGO\10-K_2024-12-20.md'


2025-11-14 15:37:33,851 - INFO - Going to convert document batch...
2025-11-14 15:37:33,852 - INFO - Processing document 10-Q_2023-03-08
2025-11-14 15:37:34,572 - INFO - Finished converting document 10-Q_2023-03-08 in 1.41 sec.
2025-11-14 15:37:35,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-03-08' --> 'data\processed_data\AVGO\10-Q_2023-03-08.md'


2025-11-14 15:37:36,235 - INFO - Going to convert document batch...
2025-11-14 15:37:36,237 - INFO - Processing document 10-Q_2023-06-07
2025-11-14 15:37:38,225 - INFO - Finished converting document 10-Q_2023-06-07 in 2.94 sec.
2025-11-14 15:37:39,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-06-07' --> 'data\processed_data\AVGO\10-Q_2023-06-07.md'


2025-11-14 15:37:41,148 - INFO - Going to convert document batch...
2025-11-14 15:37:41,149 - INFO - Processing document 10-Q_2023-09-06
2025-11-14 15:37:43,051 - INFO - Finished converting document 10-Q_2023-09-06 in 3.84 sec.
2025-11-14 15:37:44,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-09-06' --> 'data\processed_data\AVGO\10-Q_2023-09-06.md'


2025-11-14 15:37:45,242 - INFO - Going to convert document batch...
2025-11-14 15:37:45,243 - INFO - Processing document 10-Q_2024-03-14
2025-11-14 15:37:47,461 - INFO - Finished converting document 10-Q_2024-03-14 in 3.09 sec.
2025-11-14 15:37:48,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-03-14' --> 'data\processed_data\AVGO\10-Q_2024-03-14.md'


2025-11-14 15:37:50,647 - INFO - Going to convert document batch...
2025-11-14 15:37:50,648 - INFO - Processing document 10-Q_2024-06-13
2025-11-14 15:37:53,258 - INFO - Finished converting document 10-Q_2024-06-13 in 4.73 sec.
2025-11-14 15:37:54,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-06-13' --> 'data\processed_data\AVGO\10-Q_2024-06-13.md'


2025-11-14 15:37:56,283 - INFO - Going to convert document batch...
2025-11-14 15:37:56,286 - INFO - Processing document 10-Q_2024-09-11
2025-11-14 15:37:58,768 - INFO - Finished converting document 10-Q_2024-09-11 in 4.31 sec.
2025-11-14 15:38:00,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-09-11' --> 'data\processed_data\AVGO\10-Q_2024-09-11.md'


2025-11-14 15:38:01,074 - INFO - Going to convert document batch...
2025-11-14 15:38:01,075 - INFO - Processing document 10-Q_2025-03-12
2025-11-14 15:38:02,646 - INFO - Finished converting document 10-Q_2025-03-12 in 2.66 sec.
2025-11-14 15:38:03,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-03-12' --> 'data\processed_data\AVGO\10-Q_2025-03-12.md'


2025-11-14 15:38:05,755 - INFO - Going to convert document batch...
2025-11-14 15:38:05,756 - INFO - Processing document 10-Q_2025-06-11
2025-11-14 15:38:07,675 - INFO - Finished converting document 10-Q_2025-06-11 in 4.05 sec.
2025-11-14 15:38:08,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-06-11' --> 'data\processed_data\AVGO\10-Q_2025-06-11.md'


2025-11-14 15:38:10,591 - INFO - Going to convert document batch...
2025-11-14 15:38:10,592 - INFO - Processing document 10-Q_2025-09-10
2025-11-14 15:38:13,028 - INFO - Finished converting document 10-Q_2025-09-10 in 4.33 sec.
2025-11-14 15:38:14,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:14,486 - INFO - Going to convert document batch...
2025-11-14 15:38:14,487 - INFO - Processing document 4_2023-01-06
2025-11-14 15:38:14,555 - INFO - Finished converting document 4_2023-01-06 in 0.09 sec.
2025-11-14 15:38:14,653 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-09-10' --> 'data\processed_data\AVGO\10-Q_2025-09-10.md'
Converted 'data\edgar_documents\AVGO\4_2023-01-06' --> 'data\processed_data\AVGO\4_2023-01-06.md'


2025-11-14 15:38:14,654 - ERROR - Input document 4_2023-01-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:14,655 - INFO - Going to convert document batch...
2025-11-14 15:38:14,692 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:14,693 - ERROR - Input document 4_2023-01-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AVGO\4_2023-01-09: File format not allowed: data\edgar_documents\AVGO\4_2023-01-09
Error processing data\edgar_documents\AVGO\4_2023-01-12: File format not allowed: data\edgar_documents\AVGO\4_2023-01-12
Error processing data\edgar_documents\AVGO\4_2023-01-23: File format not allowed: data\edgar_documents\AVGO\4_2023-01-23
Error processing data\edgar_documents\AVGO\4_2023-01-31: File format not allowed: data\edgar_documents\AVGO\4_2023-01-31
Error processing data\edgar_documents\AVGO\4_2023-02-09: File format not allowed: data\edgar_documents\AVGO\4_2023-02-09


2025-11-14 15:38:14,847 - ERROR - Input document 4_2023-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:14,849 - INFO - Going to convert document batch...
2025-11-14 15:38:14,874 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:14,876 - ERROR - Input document 4_2023-03-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AVGO\4_2023-02-15: File format not allowed: data\edgar_documents\AVGO\4_2023-02-15
Error processing data\edgar_documents\AVGO\4_2023-03-09: File format not allowed: data\edgar_documents\AVGO\4_2023-03-09
Converted 'data\edgar_documents\AVGO\4_2023-03-10' --> 'data\processed_data\AVGO\4_2023-03-10.md'


2025-11-14 15:38:15,059 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:15,061 - ERROR - Input document 4_2023-03-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:15,063 - INFO - Going to convert document batch...
2025-11-14 15:38:15,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,116 - INFO - Going to convert document batch...
2025-11-14 15:38:15,118 - INFO - Processing document 4_2023-03-16
2025-11-14 15:38:15,187 - INFO - Fin

Error processing data\edgar_documents\AVGO\4_2023-03-15: File format not allowed: data\edgar_documents\AVGO\4_2023-03-15
Converted 'data\edgar_documents\AVGO\4_2023-03-16' --> 'data\processed_data\AVGO\4_2023-03-16.md'


2025-11-14 15:38:15,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,339 - INFO - Going to convert document batch...
2025-11-14 15:38:15,343 - INFO - Processing document 4_2023-03-17
2025-11-14 15:38:15,411 - INFO - Finished converting document 4_2023-03-17 in 0.14 sec.
2025-11-14 15:38:15,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,487 - INFO - Going to convert document batch...
2025-11-14 15:38:15,490 - INFO - Processing document 4_2023-03-20
2025-11-14 15:38:15,540 - INFO - Finished converting document 4_2023-03-20 in 0.08 sec.
2025-11-14 15:38:15,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2023-03-17' --> 'data\processed_data\AVGO\4_2023-03-17.md'
Converted 'data\edgar_documents\AVGO\4_2023-03-20' --> 'data\processed_data\AVGO\4_2023-03-20.md'


2025-11-14 15:38:15,649 - INFO - Going to convert document batch...
2025-11-14 15:38:15,652 - INFO - Processing document 4_2023-03-29
2025-11-14 15:38:15,737 - INFO - Finished converting document 4_2023-03-29 in 0.14 sec.
2025-11-14 15:38:15,833 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:15,834 - ERROR - Input document 4_2023-03-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:15,836 - INFO - Going to convert document batch...
2025-11-14 15:38:15,851 - IN

Converted 'data\edgar_documents\AVGO\4_2023-03-29' --> 'data\processed_data\AVGO\4_2023-03-29.md'
Error processing data\edgar_documents\AVGO\4_2023-03-30: File format not allowed: data\edgar_documents\AVGO\4_2023-03-30
Converted 'data\edgar_documents\AVGO\4_2023-04-05' --> 'data\processed_data\AVGO\4_2023-04-05.md'


2025-11-14 15:38:16,025 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,027 - ERROR - Input document 4_2023-04-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,029 - INFO - Going to convert document batch...
2025-11-14 15:38:16,051 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,052 - ERROR - Input document 4_2023-05-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AVGO\4_2023-04-25: File format not allowed: data\edgar_documents\AVGO\4_2023-04-25
Error processing data\edgar_documents\AVGO\4_2023-05-04: File format not allowed: data\edgar_documents\AVGO\4_2023-05-04
Error processing data\edgar_documents\AVGO\4_2023-06-07: File format not allowed: data\edgar_documents\AVGO\4_2023-06-07


2025-11-14 15:38:16,259 - INFO - Finished converting document 4_2023-06-12 in 0.14 sec.
2025-11-14 15:38:16,373 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,374 - ERROR - Input document 4_2023-06-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,376 - INFO - Going to convert document batch...
2025-11-14 15:38:16,393 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,395 - ERROR - Input document 4_2023-06-27 with forma

Converted 'data\edgar_documents\AVGO\4_2023-06-12' --> 'data\processed_data\AVGO\4_2023-06-12.md'
Error processing data\edgar_documents\AVGO\4_2023-06-26: File format not allowed: data\edgar_documents\AVGO\4_2023-06-26
Error processing data\edgar_documents\AVGO\4_2023-06-27: File format not allowed: data\edgar_documents\AVGO\4_2023-06-27


2025-11-14 15:38:16,607 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,609 - ERROR - Input document 4_2023-06-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,611 - INFO - Going to convert document batch...
2025-11-14 15:38:16,653 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,655 - ERROR - Input document 4_2023-07-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\AVGO\4_2023-06-29' --> 'data\processed_data\AVGO\4_2023-06-29.md'
Error processing data\edgar_documents\AVGO\4_2023-06-30: File format not allowed: data\edgar_documents\AVGO\4_2023-06-30
Error processing data\edgar_documents\AVGO\4_2023-07-12: File format not allowed: data\edgar_documents\AVGO\4_2023-07-12
Error processing data\edgar_documents\AVGO\4_2023-08-21: File format not allowed: data\edgar_documents\AVGO\4_2023-08-21
Error processing data\edgar_documents\AVGO\4_2023-08-28: File format not allowed: data\edgar_documents\AVGO\4_2023-08-28


2025-11-14 15:38:16,782 - INFO - Going to convert document batch...
2025-11-14 15:38:16,785 - INFO - Processing document 4_2023-09-08
2025-11-14 15:38:16,841 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:38:16,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:16,948 - INFO - Going to convert document batch...
2025-11-14 15:38:16,951 - INFO - Processing document 4_2023-09-14
2025-11-14 15:38:17,009 - INFO - Finished converting document 4_2023-09-14 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2023-09-08' --> 'data\processed_data\AVGO\4_2023-09-08.md'
Converted 'data\edgar_documents\AVGO\4_2023-09-14' --> 'data\processed_data\AVGO\4_2023-09-14.md'


2025-11-14 15:38:17,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,111 - INFO - Going to convert document batch...
2025-11-14 15:38:17,113 - INFO - Processing document 4_2023-09-19
2025-11-14 15:38:17,175 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 15:38:17,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,300 - INFO - Going to convert document batch...
2025-11-14 15:38:17,303 - INFO - Processing document 4_2023-09-26
2025-11-14 15:38:17,362 - INFO - Finished converting document 4_2023-09-26 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2023-09-19' --> 'data\processed_data\AVGO\4_2023-09-19.md'
Converted 'data\edgar_documents\AVGO\4_2023-09-26' --> 'data\processed_data\AVGO\4_2023-09-26.md'


2025-11-14 15:38:17,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,483 - INFO - Going to convert document batch...
2025-11-14 15:38:17,486 - INFO - Processing document 4_2023-10-06
2025-11-14 15:38:17,557 - INFO - Finished converting document 4_2023-10-06 in 0.14 sec.
2025-11-14 15:38:17,647 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:17,649 - ERROR - Input document 4_2023-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38

Converted 'data\edgar_documents\AVGO\4_2023-10-06' --> 'data\processed_data\AVGO\4_2023-10-06.md'
Error processing data\edgar_documents\AVGO\4_2023-10-18: File format not allowed: data\edgar_documents\AVGO\4_2023-10-18
Error processing data\edgar_documents\AVGO\4_2023-10-30: File format not allowed: data\edgar_documents\AVGO\4_2023-10-30


2025-11-14 15:38:17,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,923 - INFO - Going to convert document batch...
2025-11-14 15:38:17,925 - INFO - Processing document 4_2023-12-15
2025-11-14 15:38:18,007 - INFO - Finished converting document 4_2023-12-15 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2023-11-07' --> 'data\processed_data\AVGO\4_2023-11-07.md'
Converted 'data\edgar_documents\AVGO\4_2023-12-15' --> 'data\processed_data\AVGO\4_2023-12-15.md'


2025-11-14 15:38:18,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,144 - INFO - Going to convert document batch...
2025-11-14 15:38:18,147 - INFO - Processing document 4_2023-12-18
2025-11-14 15:38:18,209 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:38:18,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,322 - INFO - Going to convert document batch...
2025-11-14 15:38:18,325 - INFO - Processing document 4_2023-12-19
2025-11-14 15:38:18,380 - INFO - Finished converting document 4_2023-12-19 in 0.09 sec.
2025-11-14 15:38:18,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2023-12-18' --> 'data\processed_data\AVGO\4_2023-12-18.md'
Converted 'data\edgar_documents\AVGO\4_2023-12-19' --> 'data\processed_data\AVGO\4_2023-12-19.md'


2025-11-14 15:38:18,519 - INFO - Going to convert document batch...
2025-11-14 15:38:18,522 - INFO - Processing document 4_2023-12-22
2025-11-14 15:38:18,664 - INFO - Finished converting document 4_2023-12-22 in 0.23 sec.
2025-11-14 15:38:18,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,750 - INFO - Going to convert document batch...
2025-11-14 15:38:18,751 - INFO - Processing document 4_2024-01-08
2025-11-14 15:38:18,797 - INFO - Finished converting document 4_2024-01-08 in 0.08 sec.
2025-11-14 15:38:18,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,883 - INFO - Going to convert document batch...
2025-11-14 15:38:18,883 - INFO - Processing document 4_2024-01-09


Converted 'data\edgar_documents\AVGO\4_2023-12-22' --> 'data\processed_data\AVGO\4_2023-12-22.md'
Converted 'data\edgar_documents\AVGO\4_2024-01-08' --> 'data\processed_data\AVGO\4_2024-01-08.md'


2025-11-14 15:38:18,937 - INFO - Finished converting document 4_2024-01-09 in 0.09 sec.
2025-11-14 15:38:18,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,008 - INFO - Going to convert document batch...
2025-11-14 15:38:19,009 - INFO - Processing document 4_2024-02-07
2025-11-14 15:38:19,055 - INFO - Finished converting document 4_2024-02-07 in 0.06 sec.
2025-11-14 15:38:19,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,152 - INFO - Going to convert document batch...
2025-11-14 15:38:19,155 - INFO - Processing document 4_2024-03-07


Converted 'data\edgar_documents\AVGO\4_2024-01-09' --> 'data\processed_data\AVGO\4_2024-01-09.md'
Converted 'data\edgar_documents\AVGO\4_2024-02-07' --> 'data\processed_data\AVGO\4_2024-02-07.md'


2025-11-14 15:38:19,223 - INFO - Finished converting document 4_2024-03-07 in 0.12 sec.
2025-11-14 15:38:19,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,347 - INFO - Going to convert document batch...
2025-11-14 15:38:19,351 - INFO - Processing document 4_2024-03-14
2025-11-14 15:38:19,403 - INFO - Finished converting document 4_2024-03-14 in 0.11 sec.
2025-11-14 15:38:19,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-03-07' --> 'data\processed_data\AVGO\4_2024-03-07.md'
Converted 'data\edgar_documents\AVGO\4_2024-03-14' --> 'data\processed_data\AVGO\4_2024-03-14.md'


2025-11-14 15:38:19,528 - INFO - Going to convert document batch...
2025-11-14 15:38:19,530 - INFO - Processing document 4_2024-03-19
2025-11-14 15:38:19,590 - INFO - Finished converting document 4_2024-03-19 in 0.14 sec.
2025-11-14 15:38:19,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,712 - INFO - Going to convert document batch...
2025-11-14 15:38:19,714 - INFO - Processing document 4_2024-03-21
2025-11-14 15:38:19,775 - INFO - Finished converting document 4_2024-03-21 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-03-19' --> 'data\processed_data\AVGO\4_2024-03-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-03-21' --> 'data\processed_data\AVGO\4_2024-03-21.md'


2025-11-14 15:38:19,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,894 - INFO - Going to convert document batch...
2025-11-14 15:38:19,896 - INFO - Processing document 4_2024-03-27
2025-11-14 15:38:19,937 - INFO - Finished converting document 4_2024-03-27 in 0.11 sec.
2025-11-14 15:38:19,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,001 - INFO - Going to convert document batch...
2025-11-14 15:38:20,002 - INFO - Processing document 4_2024-04-01
2025-11-14 15:38:20,049 - INFO - Finished converting document 4_2024-04-01 in 0.08 sec.


Converted 'data\edgar_documents\AVGO\4_2024-03-27' --> 'data\processed_data\AVGO\4_2024-03-27.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-01' --> 'data\processed_data\AVGO\4_2024-04-01.md'


2025-11-14 15:38:20,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,171 - INFO - Going to convert document batch...
2025-11-14 15:38:20,172 - INFO - Processing document 4_2024-04-04
2025-11-14 15:38:20,217 - INFO - Finished converting document 4_2024-04-04 in 0.09 sec.
2025-11-14 15:38:20,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,308 - INFO - Going to convert document batch...
2025-11-14 15:38:20,310 - INFO - Processing document 4_2024-04-05
2025-11-14 15:38:20,360 - INFO - Finished converting document 4_2024-04-05 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-04-04' --> 'data\processed_data\AVGO\4_2024-04-04.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-05' --> 'data\processed_data\AVGO\4_2024-04-05.md'


2025-11-14 15:38:20,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,466 - INFO - Going to convert document batch...
2025-11-14 15:38:20,468 - INFO - Processing document 4_2024-04-09
2025-11-14 15:38:20,538 - INFO - Finished converting document 4_2024-04-09 in 0.12 sec.
2025-11-14 15:38:20,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,653 - INFO - Going to convert document batch...
2025-11-14 15:38:20,656 - INFO - Processing document 4_2024-04-12
2025-11-14 15:38:20,731 - INFO - Finished converting document 4_2024-04-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-04-09' --> 'data\processed_data\AVGO\4_2024-04-09.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-12' --> 'data\processed_data\AVGO\4_2024-04-12.md'


2025-11-14 15:38:20,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,815 - INFO - Going to convert document batch...
2025-11-14 15:38:20,816 - INFO - Processing document 4_2024-04-17
2025-11-14 15:38:20,880 - INFO - Finished converting document 4_2024-04-17 in 0.11 sec.
2025-11-14 15:38:20,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,994 - INFO - Going to convert document batch...
2025-11-14 15:38:20,996 - INFO - Processing document 4_2024-04-24
2025-11-14 15:38:21,052 - INFO - Finished converting document 4_2024-04-24 in 0.11 sec.
2025-11-14 15:38:21,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,126 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\4_2024-04-17' --> 'data\processed_data\AVGO\4_2024-04-17.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-24' --> 'data\processed_data\AVGO\4_2024-04-24.md'


2025-11-14 15:38:21,128 - INFO - Processing document 4_2024-06-20
2025-11-14 15:38:21,200 - INFO - Finished converting document 4_2024-06-20 in 0.11 sec.
2025-11-14 15:38:21,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,324 - INFO - Going to convert document batch...
2025-11-14 15:38:21,327 - INFO - Processing document 4_2024-06-24
2025-11-14 15:38:21,373 - INFO - Finished converting document 4_2024-06-24 in 0.09 sec.
2025-11-14 15:38:21,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-06-20' --> 'data\processed_data\AVGO\4_2024-06-20.md'
Converted 'data\edgar_documents\AVGO\4_2024-06-24' --> 'data\processed_data\AVGO\4_2024-06-24.md'


2025-11-14 15:38:21,461 - INFO - Going to convert document batch...
2025-11-14 15:38:21,462 - INFO - Processing document 4_2024-06-25
2025-11-14 15:38:21,494 - INFO - Finished converting document 4_2024-06-25 in 0.09 sec.
2025-11-14 15:38:21,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,589 - INFO - Going to convert document batch...
2025-11-14 15:38:21,591 - INFO - Processing document 4_2024-06-27
2025-11-14 15:38:21,657 - INFO - Finished converting document 4_2024-06-27 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-06-25' --> 'data\processed_data\AVGO\4_2024-06-25.md'


2025-11-14 15:38:21,765 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:21,766 - ERROR - Input document 4_2024-07-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:21,770 - INFO - Going to convert document batch...
2025-11-14 15:38:21,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,812 - INFO - Going to convert document batch...
2025-11-14 15:38:21,813 - INFO - Processing document 4_2024-07-09
2025-11-14 15:38:21,856 - INFO - Fin

Converted 'data\edgar_documents\AVGO\4_2024-06-27' --> 'data\processed_data\AVGO\4_2024-06-27.md'
Error processing data\edgar_documents\AVGO\4_2024-07-08: File format not allowed: data\edgar_documents\AVGO\4_2024-07-08
Converted 'data\edgar_documents\AVGO\4_2024-07-09' --> 'data\processed_data\AVGO\4_2024-07-09.md'


2025-11-14 15:38:21,979 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:21,982 - ERROR - Input document 4_2024-07-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:21,984 - INFO - Going to convert document batch...
2025-11-14 15:38:22,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,033 - INFO - Going to convert document batch...
2025-11-14 15:38:22,036 - INFO - Processing document 4_2024-07-15
2025-11-14 15:38:22,079 - INFO - Fin

Error processing data\edgar_documents\AVGO\4_2024-07-10: File format not allowed: data\edgar_documents\AVGO\4_2024-07-10
Converted 'data\edgar_documents\AVGO\4_2024-07-15' --> 'data\processed_data\AVGO\4_2024-07-15.md'


2025-11-14 15:38:22,183 - INFO - Processing document 4_2024-09-19
2025-11-14 15:38:22,253 - INFO - Finished converting document 4_2024-09-19 in 0.12 sec.
2025-11-14 15:38:22,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,344 - INFO - Going to convert document batch...
2025-11-14 15:38:22,346 - INFO - Processing document 4_2024-09-23
2025-11-14 15:38:22,393 - INFO - Finished converting document 4_2024-09-23 in 0.09 sec.
2025-11-14 15:38:22,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-09-19' --> 'data\processed_data\AVGO\4_2024-09-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-09-23' --> 'data\processed_data\AVGO\4_2024-09-23.md'


2025-11-14 15:38:22,513 - INFO - Going to convert document batch...
2025-11-14 15:38:22,514 - INFO - Processing document 4_2024-09-26
2025-11-14 15:38:22,575 - INFO - Finished converting document 4_2024-09-26 in 0.12 sec.
2025-11-14 15:38:22,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,681 - INFO - Going to convert document batch...
2025-11-14 15:38:22,683 - INFO - Processing document 4_2024-09-27
2025-11-14 15:38:22,742 - INFO - Finished converting document 4_2024-09-27 in 0.09 sec.
2025-11-14 15:38:22,821 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:22,823 - ERROR - Input document 4_2024-09-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\AVGO\4_2024-09-26' --> 'data\processed_data\AVGO\4_2024-09-26.md'
Converted 'data\edgar_documents\AVGO\4_2024-09-27' --> 'data\processed_data\AVGO\4_2024-09-27.md'


2025-11-14 15:38:22,826 - INFO - Going to convert document batch...
2025-11-14 15:38:22,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,885 - INFO - Going to convert document batch...
2025-11-14 15:38:22,889 - INFO - Processing document 4_2024-10-03
2025-11-14 15:38:22,964 - INFO - Finished converting document 4_2024-10-03 in 0.14 sec.


Error processing data\edgar_documents\AVGO\4_2024-09-30: File format not allowed: data\edgar_documents\AVGO\4_2024-09-30
Converted 'data\edgar_documents\AVGO\4_2024-10-03' --> 'data\processed_data\AVGO\4_2024-10-03.md'


2025-11-14 15:38:23,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,067 - INFO - Going to convert document batch...
2025-11-14 15:38:23,070 - INFO - Processing document 4_2024-10-07
2025-11-14 15:38:23,120 - INFO - Finished converting document 4_2024-10-07 in 0.12 sec.
2025-11-14 15:38:23,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,191 - INFO - Going to convert document batch...
2025-11-14 15:38:23,193 - INFO - Processing document 4_2024-10-09
2025-11-14 15:38:23,277 - INFO - Finished converting document 4_2024-10-09 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-10-07' --> 'data\processed_data\AVGO\4_2024-10-07.md'
Converted 'data\edgar_documents\AVGO\4_2024-10-09' --> 'data\processed_data\AVGO\4_2024-10-09.md'


2025-11-14 15:38:23,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,387 - INFO - Going to convert document batch...
2025-11-14 15:38:23,389 - INFO - Processing document 4_2024-10-11
2025-11-14 15:38:23,453 - INFO - Finished converting document 4_2024-10-11 in 0.12 sec.
2025-11-14 15:38:23,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,567 - INFO - Going to convert document batch...
2025-11-14 15:38:23,568 - INFO - Processing document 4_2024-10-16
2025-11-14 15:38:23,630 - INFO - Finished converting document 4_2024-10-16 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-10-11' --> 'data\processed_data\AVGO\4_2024-10-11.md'
Converted 'data\edgar_documents\AVGO\4_2024-10-16' --> 'data\processed_data\AVGO\4_2024-10-16.md'


2025-11-14 15:38:23,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,774 - INFO - Going to convert document batch...
2025-11-14 15:38:23,776 - INFO - Processing document 4_2024-11-08
2025-11-14 15:38:23,837 - INFO - Finished converting document 4_2024-11-08 in 0.14 sec.
2025-11-14 15:38:23,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,938 - INFO - Going to convert document batch...
2025-11-14 15:38:23,940 - INFO - Processing document 4_2024-12-18
2025-11-14 15:38:23,997 - INFO - Finished converting document 4_2024-12-18 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-11-08' --> 'data\processed_data\AVGO\4_2024-11-08.md'
Converted 'data\edgar_documents\AVGO\4_2024-12-18' --> 'data\processed_data\AVGO\4_2024-12-18.md'


2025-11-14 15:38:24,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,114 - INFO - Going to convert document batch...
2025-11-14 15:38:24,116 - INFO - Processing document 4_2024-12-19
2025-11-14 15:38:24,183 - INFO - Finished converting document 4_2024-12-19 in 0.12 sec.
2025-11-14 15:38:24,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,312 - INFO - Going to convert document batch...
2025-11-14 15:38:24,315 - INFO - Processing document 4_2024-12-26
2025-11-14 15:38:24,375 - INFO - Finished converting document 4_2024-12-26 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-12-19' --> 'data\processed_data\AVGO\4_2024-12-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-12-26' --> 'data\processed_data\AVGO\4_2024-12-26.md'


2025-11-14 15:38:24,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,490 - INFO - Going to convert document batch...
2025-11-14 15:38:24,492 - INFO - Processing document 4_2024-12-27
2025-11-14 15:38:24,549 - INFO - Finished converting document 4_2024-12-27 in 0.12 sec.
2025-11-14 15:38:24,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-12-27' --> 'data\processed_data\AVGO\4_2024-12-27.md'


2025-11-14 15:38:25,601 - INFO - Going to convert document batch...
2025-11-14 15:38:25,602 - INFO - Processing document 4_2025-01-06
2025-11-14 15:38:25,689 - INFO - Finished converting document 4_2025-01-06 in 1.05 sec.
2025-11-14 15:38:25,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:25,821 - INFO - Going to convert document batch...
2025-11-14 15:38:25,823 - INFO - Processing document 4_2025-01-08
2025-11-14 15:38:25,880 - INFO - Finished converting document 4_2025-01-08 in 0.11 sec.
2025-11-14 15:38:25,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-01-06' --> 'data\processed_data\AVGO\4_2025-01-06.md'
Converted 'data\edgar_documents\AVGO\4_2025-01-08' --> 'data\processed_data\AVGO\4_2025-01-08.md'


2025-11-14 15:38:25,986 - INFO - Going to convert document batch...
2025-11-14 15:38:25,988 - INFO - Processing document 4_2025-01-10
2025-11-14 15:38:26,059 - INFO - Finished converting document 4_2025-01-10 in 0.12 sec.
2025-11-14 15:38:26,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,172 - INFO - Going to convert document batch...
2025-11-14 15:38:26,174 - INFO - Processing document 4_2025-03-06
2025-11-14 15:38:26,256 - INFO - Finished converting document 4_2025-03-06 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\4_2025-01-10' --> 'data\processed_data\AVGO\4_2025-01-10.md'
Converted 'data\edgar_documents\AVGO\4_2025-03-06' --> 'data\processed_data\AVGO\4_2025-03-06.md'


2025-11-14 15:38:26,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,383 - INFO - Going to convert document batch...
2025-11-14 15:38:26,387 - INFO - Processing document 4_2025-03-18
2025-11-14 15:38:26,455 - INFO - Finished converting document 4_2025-03-18 in 0.14 sec.
2025-11-14 15:38:26,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,588 - INFO - Going to convert document batch...
2025-11-14 15:38:26,590 - INFO - Processing document 4_2025-03-19
2025-11-14 15:38:26,659 - INFO - Finished converting document 4_2025-03-19 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\4_2025-03-18' --> 'data\processed_data\AVGO\4_2025-03-18.md'
Converted 'data\edgar_documents\AVGO\4_2025-03-19' --> 'data\processed_data\AVGO\4_2025-03-19.md'


2025-11-14 15:38:26,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,790 - INFO - Going to convert document batch...
2025-11-14 15:38:26,793 - INFO - Processing document 4_2025-03-26
2025-11-14 15:38:26,840 - INFO - Finished converting document 4_2025-03-26 in 0.14 sec.
2025-11-14 15:38:26,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,976 - INFO - Going to convert document batch...
2025-11-14 15:38:26,979 - INFO - Processing document 4_2025-03-28


Converted 'data\edgar_documents\AVGO\4_2025-03-26' --> 'data\processed_data\AVGO\4_2025-03-26.md'


2025-11-14 15:38:27,101 - INFO - Finished converting document 4_2025-03-28 in 0.20 sec.
2025-11-14 15:38:27,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,251 - INFO - Going to convert document batch...
2025-11-14 15:38:27,252 - INFO - Processing document 4_2025-04-15
2025-11-14 15:38:27,290 - INFO - Finished converting document 4_2025-04-15 in 0.08 sec.
2025-11-14 15:38:27,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,360 - INFO - Going to convert document batch...
2025-11-14 15:38:27,361 - INFO - Processing document 4_2025-04-16
2025-11-14 15:38:27,399 - INFO - Finished converting document 4_2025-04-16 in 0.06 sec.


Converted 'data\edgar_documents\AVGO\4_2025-03-28' --> 'data\processed_data\AVGO\4_2025-03-28.md'
Converted 'data\edgar_documents\AVGO\4_2025-04-15' --> 'data\processed_data\AVGO\4_2025-04-15.md'


2025-11-14 15:38:27,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,509 - INFO - Going to convert document batch...
2025-11-14 15:38:27,513 - INFO - Processing document 4_2025-04-23
2025-11-14 15:38:27,579 - INFO - Finished converting document 4_2025-04-23 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2025-04-16' --> 'data\processed_data\AVGO\4_2025-04-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-04-23' --> 'data\processed_data\AVGO\4_2025-04-23.md'


2025-11-14 15:38:27,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,694 - INFO - Going to convert document batch...
2025-11-14 15:38:27,696 - INFO - Processing document 4_2025-05-16
2025-11-14 15:38:27,752 - INFO - Finished converting document 4_2025-05-16 in 0.11 sec.
2025-11-14 15:38:27,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,859 - INFO - Going to convert document batch...
2025-11-14 15:38:27,861 - INFO - Processing document 4_2025-06-13
2025-11-14 15:38:27,917 - INFO - Finished converting document 4_2025-06-13 in 0.11 sec.
2025-11-14 15:38:28,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-05-16' --> 'data\processed_data\AVGO\4_2025-05-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-13' --> 'data\processed_data\AVGO\4_2025-06-13.md'


2025-11-14 15:38:28,031 - INFO - Going to convert document batch...
2025-11-14 15:38:28,032 - INFO - Processing document 4_2025-06-16
2025-11-14 15:38:28,102 - INFO - Finished converting document 4_2025-06-16 in 0.11 sec.
2025-11-14 15:38:28,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,189 - INFO - Going to convert document batch...
2025-11-14 15:38:28,192 - INFO - Processing document 4_2025-06-18
2025-11-14 15:38:28,263 - INFO - Finished converting document 4_2025-06-18 in 0.11 sec.
2025-11-14 15:38:28,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-06-16' --> 'data\processed_data\AVGO\4_2025-06-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-18' --> 'data\processed_data\AVGO\4_2025-06-18.md'


2025-11-14 15:38:28,362 - INFO - Going to convert document batch...
2025-11-14 15:38:28,364 - INFO - Processing document 4_2025-06-23
2025-11-14 15:38:28,432 - INFO - Finished converting document 4_2025-06-23 in 0.12 sec.
2025-11-14 15:38:28,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,545 - INFO - Going to convert document batch...
2025-11-14 15:38:28,547 - INFO - Processing document 4_2025-06-25
2025-11-14 15:38:28,612 - INFO - Finished converting document 4_2025-06-25 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-23' --> 'data\processed_data\AVGO\4_2025-06-23.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-25' --> 'data\processed_data\AVGO\4_2025-06-25.md'


2025-11-14 15:38:28,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,754 - INFO - Going to convert document batch...
2025-11-14 15:38:28,756 - INFO - Processing document 4_2025-06-26
2025-11-14 15:38:28,794 - INFO - Finished converting document 4_2025-06-26 in 0.12 sec.
2025-11-14 15:38:28,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,923 - INFO - Going to convert document batch...
2025-11-14 15:38:28,927 - INFO - Processing document 4_2025-06-27
2025-11-14 15:38:29,014 - INFO - Finished converting document 4_2025-06-27 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-26' --> 'data\processed_data\AVGO\4_2025-06-26.md'


2025-11-14 15:38:29,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:29,164 - INFO - Going to convert document batch...
2025-11-14 15:38:29,165 - INFO - Processing document 4_2025-06-30
2025-11-14 15:38:29,235 - INFO - Finished converting document 4_2025-06-30 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-27' --> 'data\processed_data\AVGO\4_2025-06-27.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-30' --> 'data\processed_data\AVGO\4_2025-06-30.md'


2025-11-14 15:38:29,362 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:29,364 - ERROR - Input document 4_2025-07-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:29,367 - INFO - Going to convert document batch...
2025-11-14 15:38:29,416 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:29,417 - ERROR - Input document 4_2025-07-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AVGO\4_2025-07-07: File format not allowed: data\edgar_documents\AVGO\4_2025-07-07
Error processing data\edgar_documents\AVGO\4_2025-07-09: File format not allowed: data\edgar_documents\AVGO\4_2025-07-09
Converted 'data\edgar_documents\AVGO\4_2025-07-11' --> 'data\processed_data\AVGO\4_2025-07-11.md'


2025-11-14 15:38:29,577 - INFO - Going to convert document batch...
2025-11-14 15:38:29,578 - INFO - Processing document 4_2025-07-16
2025-11-14 15:38:29,616 - INFO - Finished converting document 4_2025-07-16 in 0.08 sec.
2025-11-14 15:38:29,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:29,690 - INFO - Going to convert document batch...
2025-11-14 15:38:29,694 - INFO - Processing document 4_2025-08-15
2025-11-14 15:38:29,741 - INFO - Finished converting document 4_2025-08-15 in 0.08 sec.
2025-11-14 15:38:29,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-07-16' --> 'data\processed_data\AVGO\4_2025-07-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-08-15' --> 'data\processed_data\AVGO\4_2025-08-15.md'


2025-11-14 15:38:29,861 - INFO - Going to convert document batch...
2025-11-14 15:38:29,864 - INFO - Processing document 4_2025-09-10
2025-11-14 15:38:29,951 - INFO - Finished converting document 4_2025-09-10 in 0.16 sec.
2025-11-14 15:38:30,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,062 - INFO - Going to convert document batch...
2025-11-14 15:38:30,064 - INFO - Processing document 4_2025-09-12
2025-11-14 15:38:30,148 - INFO - Finished converting document 4_2025-09-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-09-10' --> 'data\processed_data\AVGO\4_2025-09-10.md'
Converted 'data\edgar_documents\AVGO\4_2025-09-12' --> 'data\processed_data\AVGO\4_2025-09-12.md'


2025-11-14 15:38:30,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,266 - INFO - Going to convert document batch...
2025-11-14 15:38:30,268 - INFO - Processing document 4_2025-09-15
2025-11-14 15:38:30,390 - INFO - Finished converting document 4_2025-09-15 in 0.17 sec.
2025-11-14 15:38:30,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,507 - INFO - Going to convert document batch...
2025-11-14 15:38:30,508 - INFO - Processing document 4_2025-09-17
2025-11-14 15:38:30,550 - INFO - Finished converting document 4_2025-09-17 in 0.08 sec.
2025-11-14 15:38:30,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-09-15' --> 'data\processed_data\AVGO\4_2025-09-15.md'
Converted 'data\edgar_documents\AVGO\4_2025-09-17' --> 'data\processed_data\AVGO\4_2025-09-17.md'


2025-11-14 15:38:30,697 - INFO - Going to convert document batch...
2025-11-14 15:38:30,698 - INFO - Processing document 4_2025-09-18
2025-11-14 15:38:30,844 - INFO - Finished converting document 4_2025-09-18 in 0.25 sec.
2025-11-14 15:38:30,988 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:30,989 - ERROR - Input document 4_2025-09-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:30,991 - INFO - Going to convert document batch...
2025-11-14 15:38:31,016 - IN

Converted 'data\edgar_documents\AVGO\4_2025-09-18' --> 'data\processed_data\AVGO\4_2025-09-18.md'
Error processing data\edgar_documents\AVGO\4_2025-09-22: File format not allowed: data\edgar_documents\AVGO\4_2025-09-22
Error processing data\edgar_documents\AVGO\4_2025-09-24: File format not allowed: data\edgar_documents\AVGO\4_2025-09-24


2025-11-14 15:38:31,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,238 - INFO - Going to convert document batch...
2025-11-14 15:38:31,240 - INFO - Processing document 4_2025-09-26
2025-11-14 15:38:31,342 - INFO - Finished converting document 4_2025-09-26 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\4_2025-09-25' --> 'data\processed_data\AVGO\4_2025-09-25.md'


2025-11-14 15:38:31,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,489 - INFO - Going to convert document batch...
2025-11-14 15:38:31,491 - INFO - Processing document 4_2025-10-16


Converted 'data\edgar_documents\AVGO\4_2025-09-26' --> 'data\processed_data\AVGO\4_2025-09-26.md'


2025-11-14 15:38:31,662 - INFO - Finished converting document 4_2025-10-16 in 0.22 sec.
2025-11-14 15:38:31,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,788 - INFO - Going to convert document batch...
2025-11-14 15:38:31,789 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:38:31,856 - INFO - Finished converting document 8-K_2023-03-02 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-10-16' --> 'data\processed_data\AVGO\4_2025-10-16.md'


2025-11-14 15:38:31,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,024 - INFO - Going to convert document batch...
2025-11-14 15:38:32,026 - INFO - Processing document 8-K_2023-04-06
2025-11-14 15:38:32,110 - INFO - Finished converting document 8-K_2023-04-06 in 0.19 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-03-02' --> 'data\processed_data\AVGO\8-K_2023-03-02.md'


2025-11-14 15:38:32,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,186 - INFO - Going to convert document batch...
2025-11-14 15:38:32,188 - INFO - Processing document 8-K_2023-05-23
2025-11-14 15:38:32,231 - INFO - Finished converting document 8-K_2023-05-23 in 0.09 sec.
2025-11-14 15:38:32,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,317 - INFO - Going to convert document batch...
2025-11-14 15:38:32,319 - INFO - Processing document 8-K_2023-06-01


Converted 'data\edgar_documents\AVGO\8-K_2023-04-06' --> 'data\processed_data\AVGO\8-K_2023-04-06.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-05-23' --> 'data\processed_data\AVGO\8-K_2023-05-23.md'


2025-11-14 15:38:32,408 - INFO - Finished converting document 8-K_2023-06-01 in 0.14 sec.
2025-11-14 15:38:32,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,552 - INFO - Going to convert document batch...
2025-11-14 15:38:32,554 - INFO - Processing document 8-K_2023-08-16
2025-11-14 15:38:32,610 - INFO - Finished converting document 8-K_2023-08-16 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-06-01' --> 'data\processed_data\AVGO\8-K_2023-06-01.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-08-16' --> 'data\processed_data\AVGO\8-K_2023-08-16.md'


2025-11-14 15:38:32,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,728 - INFO - Going to convert document batch...
2025-11-14 15:38:32,730 - INFO - Processing document 8-K_2023-08-31
2025-11-14 15:38:32,823 - INFO - Finished converting document 8-K_2023-08-31 in 0.19 sec.
2025-11-14 15:38:32,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,936 - INFO - Going to convert document batch...
2025-11-14 15:38:32,938 - INFO - Processing document 8-K_2023-10-18
2025-11-14 15:38:32,986 - INFO - Finished converting document 8-K_2023-10-18 in 0.11 sec.
2025-11-14 15:38:33,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\8-K_2023-08-31' --> 'data\processed_data\AVGO\8-K_2023-08-31.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-10-18' --> 'data\processed_data\AVGO\8-K_2023-10-18.md'


2025-11-14 15:38:33,065 - INFO - Going to convert document batch...
2025-11-14 15:38:33,069 - INFO - Processing document 8-K_2023-10-30
2025-11-14 15:38:33,143 - INFO - Finished converting document 8-K_2023-10-30 in 0.12 sec.
2025-11-14 15:38:33,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,250 - INFO - Going to convert document batch...
2025-11-14 15:38:33,252 - INFO - Processing document 8-K_2023-11-22
2025-11-14 15:38:33,315 - INFO - Finished converting document 8-K_2023-11-22 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-10-30' --> 'data\processed_data\AVGO\8-K_2023-10-30.md'


2025-11-14 15:38:33,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,439 - INFO - Going to convert document batch...
2025-11-14 15:38:33,441 - INFO - Processing document 8-K_2023-12-07
2025-11-14 15:38:33,537 - INFO - Finished converting document 8-K_2023-12-07 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-11-22' --> 'data\processed_data\AVGO\8-K_2023-11-22.md'


2025-11-14 15:38:33,595 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:33,596 - ERROR - Input document 8-K_2024-02-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:33,598 - INFO - Going to convert document batch...
2025-11-14 15:38:33,616 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:33,618 - ERROR - Input document 8-K_2024-02-09 with format None does 

Converted 'data\edgar_documents\AVGO\8-K_2023-12-07' --> 'data\processed_data\AVGO\8-K_2023-12-07.md'
Error processing data\edgar_documents\AVGO\8-K_2024-02-08: File format not allowed: data\edgar_documents\AVGO\8-K_2024-02-08
Error processing data\edgar_documents\AVGO\8-K_2024-02-09: File format not allowed: data\edgar_documents\AVGO\8-K_2024-02-09


2025-11-14 15:38:33,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,890 - INFO - Going to convert document batch...
2025-11-14 15:38:33,892 - INFO - Processing document 8-K_2024-04-24


Converted 'data\edgar_documents\AVGO\8-K_2024-03-07' --> 'data\processed_data\AVGO\8-K_2024-03-07.md'


2025-11-14 15:38:34,010 - INFO - Finished converting document 8-K_2024-04-24 in 0.23 sec.
2025-11-14 15:38:34,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,120 - INFO - Going to convert document batch...
2025-11-14 15:38:34,122 - INFO - Processing document 8-K_2024-06-12
2025-11-14 15:38:34,195 - INFO - Finished converting document 8-K_2024-06-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2024-04-24' --> 'data\processed_data\AVGO\8-K_2024-04-24.md'
Converted 'data\edgar_documents\AVGO\8-K_2024-06-12' --> 'data\processed_data\AVGO\8-K_2024-06-12.md'


2025-11-14 15:38:34,280 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:34,281 - ERROR - Input document 8-K_2024-07-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:34,284 - INFO - Going to convert document batch...
2025-11-14 15:38:34,308 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:34,309 - ERROR - Input document 8-K_2024-07-12 with format None does 

Error processing data\edgar_documents\AVGO\8-K_2024-07-08: File format not allowed: data\edgar_documents\AVGO\8-K_2024-07-08
Error processing data\edgar_documents\AVGO\8-K_2024-07-12: File format not allowed: data\edgar_documents\AVGO\8-K_2024-07-12


2025-11-14 15:38:34,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,551 - INFO - Going to convert document batch...
2025-11-14 15:38:34,553 - INFO - Processing document 8-K_2024-10-02
2025-11-14 15:38:34,605 - INFO - Finished converting document 8-K_2024-10-02 in 0.11 sec.
2025-11-14 15:38:34,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2024-09-05' --> 'data\processed_data\AVGO\8-K_2024-09-05.md'
Converted 'data\edgar_documents\AVGO\8-K_2024-10-02' --> 'data\processed_data\AVGO\8-K_2024-10-02.md'


2025-11-14 15:38:34,683 - INFO - Processing document 8-K_2024-12-12
2025-11-14 15:38:34,746 - INFO - Finished converting document 8-K_2024-12-12 in 0.12 sec.
2025-11-14 15:38:34,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,825 - INFO - Going to convert document batch...
2025-11-14 15:38:34,826 - INFO - Processing document 8-K_2025-01-10
2025-11-14 15:38:34,864 - INFO - Finished converting document 8-K_2025-01-10 in 0.08 sec.
2025-11-14 15:38:34,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,928 - INFO - Going to convert document batch...
2025-11-14 15:38:34,929 - INFO - Processing document 8-K_2025-01-13


Converted 'data\edgar_documents\AVGO\8-K_2024-12-12' --> 'data\processed_data\AVGO\8-K_2024-12-12.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-01-10' --> 'data\processed_data\AVGO\8-K_2025-01-10.md'


2025-11-14 15:38:35,480 - INFO - Finished converting document 8-K_2025-01-13 in 0.59 sec.
2025-11-14 15:38:35,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,547 - INFO - Going to convert document batch...
2025-11-14 15:38:35,549 - INFO - Processing document 8-K_2025-03-06
2025-11-14 15:38:35,630 - INFO - Finished converting document 8-K_2025-03-06 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2025-01-13' --> 'data\processed_data\AVGO\8-K_2025-01-13.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-03-06' --> 'data\processed_data\AVGO\8-K_2025-03-06.md'


2025-11-14 15:38:35,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,767 - INFO - Going to convert document batch...
2025-11-14 15:38:35,768 - INFO - Processing document 8-K_2025-04-22
2025-11-14 15:38:35,849 - INFO - Finished converting document 8-K_2025-04-22 in 0.17 sec.
2025-11-14 15:38:35,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,971 - INFO - Going to convert document batch...
2025-11-14 15:38:35,973 - INFO - Processing document 8-K_2025-06-05
2025-11-14 15:38:36,034 - INFO - Finished converting document 8-K_2025-06-05 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2025-04-22' --> 'data\processed_data\AVGO\8-K_2025-04-22.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-06-05' --> 'data\processed_data\AVGO\8-K_2025-06-05.md'


2025-11-14 15:38:36,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,173 - INFO - Going to convert document batch...
2025-11-14 15:38:36,176 - INFO - Processing document 8-K_2025-07-11
2025-11-14 15:38:36,234 - INFO - Finished converting document 8-K_2025-07-11 in 0.14 sec.
2025-11-14 15:38:36,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,299 - INFO - Going to convert document batch...
2025-11-14 15:38:36,300 - INFO - Processing document 8-K_2025-09-04
2025-11-14 15:38:36,350 - INFO - Finished converting document 8-K_2025-09-04 in 0.08 sec.
2025-11-14 15:38:36,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,462 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2025-07-11' --> 'data\processed_data\AVGO\8-K_2025-07-11.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-09-04' --> 'data\processed_data\AVGO\8-K_2025-09-04.md'


2025-11-14 15:38:36,465 - INFO - Processing document 8-K_2025-09-09
2025-11-14 15:38:36,516 - INFO - Finished converting document 8-K_2025-09-09 in 0.14 sec.
2025-11-14 15:38:36,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,607 - INFO - Going to convert document batch...
2025-11-14 15:38:36,610 - INFO - Processing document 8-K_2025-09-10
2025-11-14 15:38:36,649 - INFO - Finished converting document 8-K_2025-09-10 in 0.09 sec.
2025-11-14 15:38:36,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,740 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2025-09-09' --> 'data\processed_data\AVGO\8-K_2025-09-09.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-09-10' --> 'data\processed_data\AVGO\8-K_2025-09-10.md'


2025-11-14 15:38:36,741 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:38:36,796 - INFO - Finished converting document 8-K_2025-09-29 in 0.14 sec.
2025-11-14 15:38:36,869 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:36,871 - ERROR - Input document DEF-14A_2023-02-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:36,874 - INFO - Going to convert document batch...
2025-11-14 15:38:36,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\8-K_2025-09-29' --> 'data\processed_data\AVGO\8-K_2025-09-29.md'
Error processing data\edgar_documents\AVGO\DEF-14A_2023-02-17: File format not allowed: data\edgar_documents\AVGO\DEF-14A_2023-02-17


2025-11-14 15:38:37,777 - INFO - Going to convert document batch...
2025-11-14 15:38:37,778 - INFO - Processing document DEF-14A_2024-02-26
2025-11-14 15:38:42,627 - INFO - Finished converting document DEF-14A_2024-02-26 in 5.75 sec.
2025-11-14 15:38:44,075 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:44,077 - ERROR - Input document DEF-14A_2025-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:44,082 - INFO - Going to 

Converted 'data\edgar_documents\AVGO\DEF-14A_2024-02-26' --> 'data\processed_data\AVGO\DEF-14A_2024-02-26.md'
Error processing data\edgar_documents\AVGO\DEF-14A_2025-03-03: File format not allowed: data\edgar_documents\AVGO\DEF-14A_2025-03-03
Processed 123 new files. Errors: 33
Found 169 files to process in data\edgar_documents\AXP


2025-11-14 15:38:44,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:47,369 - INFO - Going to convert document batch...
2025-11-14 15:38:47,371 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:38:47,372 - INFO - Processing document 10-K_2023-02-10
2025-11-14 15:38:55,893 - INFO - Finished converting document 10-K_2023-02-10 in 11.78 sec.
2025-11-14 15:38:58,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2023-02-10' --> 'data\processed_data\AXP\10-K_2023-02-10.md'


2025-11-14 15:39:02,351 - INFO - Going to convert document batch...
2025-11-14 15:39:02,353 - INFO - Processing document 10-K_2024-02-09
2025-11-14 15:39:10,848 - INFO - Finished converting document 10-K_2024-02-09 in 12.24 sec.
2025-11-14 15:39:14,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2024-02-09' --> 'data\processed_data\AXP\10-K_2024-02-09.md'


2025-11-14 15:39:18,675 - INFO - Going to convert document batch...
2025-11-14 15:39:18,677 - INFO - Processing document 10-K_2025-02-07
2025-11-14 15:39:25,623 - INFO - Finished converting document 10-K_2025-02-07 in 10.98 sec.
2025-11-14 15:39:28,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2025-02-07' --> 'data\processed_data\AXP\10-K_2025-02-07.md'


2025-11-14 15:39:30,140 - INFO - Going to convert document batch...
2025-11-14 15:39:30,141 - INFO - Processing document 10-Q_2023-04-21
2025-11-14 15:39:33,239 - INFO - Finished converting document 10-Q_2023-04-21 in 4.75 sec.
2025-11-14 15:39:34,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-04-21' --> 'data\processed_data\AXP\10-Q_2023-04-21.md'


2025-11-14 15:39:37,886 - INFO - Going to convert document batch...
2025-11-14 15:39:37,888 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 15:39:42,121 - INFO - Finished converting document 10-Q_2023-07-25 in 7.58 sec.
2025-11-14 15:39:44,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-07-25' --> 'data\processed_data\AXP\10-Q_2023-07-25.md'


2025-11-14 15:39:46,556 - INFO - Going to convert document batch...
2025-11-14 15:39:46,558 - INFO - Processing document 10-Q_2023-10-20
2025-11-14 15:39:50,003 - INFO - Finished converting document 10-Q_2023-10-20 in 6.03 sec.
2025-11-14 15:39:52,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-10-20' --> 'data\processed_data\AXP\10-Q_2023-10-20.md'


2025-11-14 15:39:54,173 - INFO - Going to convert document batch...
2025-11-14 15:39:54,174 - INFO - Processing document 10-Q_2024-04-19
2025-11-14 15:39:57,332 - INFO - Finished converting document 10-Q_2024-04-19 in 4.69 sec.
2025-11-14 15:39:58,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-04-19' --> 'data\processed_data\AXP\10-Q_2024-04-19.md'


2025-11-14 15:40:00,586 - INFO - Going to convert document batch...
2025-11-14 15:40:00,587 - INFO - Processing document 10-Q_2024-07-19
2025-11-14 15:40:02,024 - INFO - Finished converting document 10-Q_2024-07-19 in 3.28 sec.
2025-11-14 15:40:02,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-07-19' --> 'data\processed_data\AXP\10-Q_2024-07-19.md'


2025-11-14 15:40:03,648 - INFO - Going to convert document batch...
2025-11-14 15:40:03,649 - INFO - Processing document 10-Q_2024-10-18
2025-11-14 15:40:05,149 - INFO - Finished converting document 10-Q_2024-10-18 in 2.52 sec.
2025-11-14 15:40:05,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-10-18' --> 'data\processed_data\AXP\10-Q_2024-10-18.md'


2025-11-14 15:40:06,881 - INFO - Going to convert document batch...
2025-11-14 15:40:06,881 - INFO - Processing document 10-Q_2025-04-18
2025-11-14 15:40:08,114 - INFO - Finished converting document 10-Q_2025-04-18 in 2.30 sec.
2025-11-14 15:40:08,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-04-18' --> 'data\processed_data\AXP\10-Q_2025-04-18.md'


2025-11-14 15:40:09,964 - INFO - Going to convert document batch...
2025-11-14 15:40:09,965 - INFO - Processing document 10-Q_2025-07-18
2025-11-14 15:40:11,501 - INFO - Finished converting document 10-Q_2025-07-18 in 2.80 sec.
2025-11-14 15:40:12,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-07-18' --> 'data\processed_data\AXP\10-Q_2025-07-18.md'


2025-11-14 15:40:13,335 - INFO - Going to convert document batch...
2025-11-14 15:40:13,336 - INFO - Processing document 10-Q_2025-10-17
2025-11-14 15:40:16,724 - INFO - Finished converting document 10-Q_2025-10-17 in 4.52 sec.
2025-11-14 15:40:18,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:18,508 - INFO - Going to convert document batch...
2025-11-14 15:40:18,509 - INFO - Processing document 4_2023-01-04
2025-11-14 15:40:18,557 - INFO - Finished converting document 4_2023-01-04 in 0.12 sec.
2025-11-14 15:40:18,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-10-17' --> 'data\processed_data\AXP\10-Q_2025-10-17.md'
Converted 'data\edgar_documents\AXP\4_2023-01-04' --> 'data\processed_data\AXP\4_2023-01-04.md'


2025-11-14 15:40:18,664 - INFO - Going to convert document batch...
2025-11-14 15:40:18,666 - INFO - Processing document 4_2023-01-31
2025-11-14 15:40:18,731 - INFO - Finished converting document 4_2023-01-31 in 0.12 sec.
2025-11-14 15:40:18,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:18,848 - INFO - Going to convert document batch...
2025-11-14 15:40:18,849 - INFO - Processing document 4_2023-02-01
2025-11-14 15:40:18,956 - INFO - Finished converting document 4_2023-02-01 in 0.16 sec.


Converted 'data\edgar_documents\AXP\4_2023-01-31' --> 'data\processed_data\AXP\4_2023-01-31.md'


2025-11-14 15:40:19,042 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,043 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:19,046 - INFO - Going to convert document batch...
2025-11-14 15:40:19,069 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,070 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\AXP\4_2023-02-01' --> 'data\processed_data\AXP\4_2023-02-01.md'
Error processing data\edgar_documents\AXP\4_2023-02-13: File format not allowed: data\edgar_documents\AXP\4_2023-02-13
Error processing data\edgar_documents\AXP\4_2023-02-14: File format not allowed: data\edgar_documents\AXP\4_2023-02-14
Converted 'data\edgar_documents\AXP\4_2023-02-16' --> 'data\processed_data\AXP\4_2023-02-16.md'


2025-11-14 15:40:19,231 - INFO - Going to convert document batch...
2025-11-14 15:40:19,232 - INFO - Processing document 4_2023-02-21
2025-11-14 15:40:19,285 - INFO - Finished converting document 4_2023-02-21 in 0.09 sec.
2025-11-14 15:40:19,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,355 - INFO - Going to convert document batch...
2025-11-14 15:40:19,356 - INFO - Processing document 4_2023-03-06
2025-11-14 15:40:19,390 - INFO - Finished converting document 4_2023-03-06 in 0.06 sec.
2025-11-14 15:40:19,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,474 - INFO - Going to convert document batch...
2025-11-14 15:40:19,475 - INFO - Processing document 4_2023-03-10


Converted 'data\edgar_documents\AXP\4_2023-02-21' --> 'data\processed_data\AXP\4_2023-02-21.md'
Converted 'data\edgar_documents\AXP\4_2023-03-06' --> 'data\processed_data\AXP\4_2023-03-06.md'


2025-11-14 15:40:19,521 - INFO - Finished converting document 4_2023-03-10 in 0.09 sec.
2025-11-14 15:40:19,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,597 - INFO - Going to convert document batch...
2025-11-14 15:40:19,598 - INFO - Processing document 4_2023-04-04
2025-11-14 15:40:19,642 - INFO - Finished converting document 4_2023-04-04 in 0.08 sec.


Converted 'data\edgar_documents\AXP\4_2023-03-10' --> 'data\processed_data\AXP\4_2023-03-10.md'
Converted 'data\edgar_documents\AXP\4_2023-04-04' --> 'data\processed_data\AXP\4_2023-04-04.md'


2025-11-14 15:40:19,762 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,764 - ERROR - Input document 4_2023-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:19,766 - INFO - Going to convert document batch...
2025-11-14 15:40:19,807 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,808 - ERROR - Input document 4_2023-04-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AXP\4_2023-04-26: File format not allowed: data\edgar_documents\AXP\4_2023-04-26
Error processing data\edgar_documents\AXP\4_2023-04-27: File format not allowed: data\edgar_documents\AXP\4_2023-04-27
Converted 'data\edgar_documents\AXP\4_2023-05-02' --> 'data\processed_data\AXP\4_2023-05-02.md'


2025-11-14 15:40:19,995 - INFO - Going to convert document batch...
2025-11-14 15:40:19,997 - INFO - Processing document 4_2023-05-04
2025-11-14 15:40:20,040 - INFO - Finished converting document 4_2023-05-04 in 0.08 sec.
2025-11-14 15:40:20,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,138 - INFO - Going to convert document batch...
2025-11-14 15:40:20,139 - INFO - Processing document 4_2023-05-22
2025-11-14 15:40:20,182 - INFO - Finished converting document 4_2023-05-22 in 0.09 sec.
2025-11-14 15:40:20,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,258 - INFO - Going to convert document batch...
2025-11-14 15:40:20,259 - INFO - Processing document 4_2023-07-05


Converted 'data\edgar_documents\AXP\4_2023-05-04' --> 'data\processed_data\AXP\4_2023-05-04.md'
Converted 'data\edgar_documents\AXP\4_2023-05-22' --> 'data\processed_data\AXP\4_2023-05-22.md'


2025-11-14 15:40:20,303 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:40:20,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,399 - INFO - Going to convert document batch...
2025-11-14 15:40:20,400 - INFO - Processing document 4_2023-07-11
2025-11-14 15:40:20,474 - INFO - Finished converting document 4_2023-07-11 in 0.11 sec.


Converted 'data\edgar_documents\AXP\4_2023-07-05' --> 'data\processed_data\AXP\4_2023-07-05.md'
Converted 'data\edgar_documents\AXP\4_2023-07-11' --> 'data\processed_data\AXP\4_2023-07-11.md'


2025-11-14 15:40:20,597 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,598 - ERROR - Input document 4_2023-07-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:20,600 - INFO - Going to convert document batch...
2025-11-14 15:40:20,627 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,628 - ERROR - Input document 4_2023-07-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AXP\4_2023-07-25: File format not allowed: data\edgar_documents\AXP\4_2023-07-25
Error processing data\edgar_documents\AXP\4_2023-07-27: File format not allowed: data\edgar_documents\AXP\4_2023-07-27
Converted 'data\edgar_documents\AXP\4_2023-08-01' --> 'data\processed_data\AXP\4_2023-08-01.md'


2025-11-14 15:40:20,786 - INFO - Processing document 4_2023-10-03
2025-11-14 15:40:20,843 - INFO - Finished converting document 4_2023-10-03 in 0.09 sec.
2025-11-14 15:40:20,934 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,935 - ERROR - Input document 4_2023-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:20,937 - INFO - Going to convert document batch...
2025-11-14 15:40:20,959 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\AXP\4_2023-10-03' --> 'data\processed_data\AXP\4_2023-10-03.md'
Error processing data\edgar_documents\AXP\4_2023-10-24: File format not allowed: data\edgar_documents\AXP\4_2023-10-24
Error processing data\edgar_documents\AXP\4_2023-10-25: File format not allowed: data\edgar_documents\AXP\4_2023-10-25


2025-11-14 15:40:21,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,129 - INFO - Going to convert document batch...
2025-11-14 15:40:21,130 - INFO - Processing document 4_2023-11-30
2025-11-14 15:40:21,171 - INFO - Finished converting document 4_2023-11-30 in 0.08 sec.
2025-11-14 15:40:21,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,256 - INFO - Going to convert document batch...
2025-11-14 15:40:21,258 - INFO - Processing document 4_2024-01-03


Converted 'data\edgar_documents\AXP\4_2023-11-17' --> 'data\processed_data\AXP\4_2023-11-17.md'
Converted 'data\edgar_documents\AXP\4_2023-11-30' --> 'data\processed_data\AXP\4_2023-11-30.md'


2025-11-14 15:40:21,303 - INFO - Finished converting document 4_2024-01-03 in 0.08 sec.
2025-11-14 15:40:21,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,383 - INFO - Going to convert document batch...
2025-11-14 15:40:21,384 - INFO - Processing document 4_2024-01-30
2025-11-14 15:40:21,425 - INFO - Finished converting document 4_2024-01-30 in 0.08 sec.
2025-11-14 15:40:21,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,542 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\4_2024-01-03' --> 'data\processed_data\AXP\4_2024-01-03.md'
Converted 'data\edgar_documents\AXP\4_2024-01-30' --> 'data\processed_data\AXP\4_2024-01-30.md'


2025-11-14 15:40:21,544 - INFO - Processing document 4_2024-01-31
2025-11-14 15:40:21,630 - INFO - Finished converting document 4_2024-01-31 in 0.16 sec.
2025-11-14 15:40:21,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,709 - INFO - Going to convert document batch...
2025-11-14 15:40:21,711 - INFO - Processing document 4_2024-02-05
2025-11-14 15:40:21,756 - INFO - Finished converting document 4_2024-02-05 in 0.06 sec.
2025-11-14 15:40:21,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,836 - INFO - Going to convert document batch...
2025-11-14 15:40:21,838 - INFO - Processing document 4_2024-02-12


Converted 'data\edgar_documents\AXP\4_2024-01-31' --> 'data\processed_data\AXP\4_2024-01-31.md'
Converted 'data\edgar_documents\AXP\4_2024-02-05' --> 'data\processed_data\AXP\4_2024-02-05.md'


2025-11-14 15:40:21,890 - INFO - Finished converting document 4_2024-02-12 in 0.09 sec.
2025-11-14 15:40:21,982 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:21,983 - ERROR - Input document 4_2024-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:21,988 - INFO - Going to convert document batch...
2025-11-14 15:40:22,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,043 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AXP\4_2024-02-12' --> 'data\processed_data\AXP\4_2024-02-12.md'
Error processing data\edgar_documents\AXP\4_2024-02-13: File format not allowed: data\edgar_documents\AXP\4_2024-02-13
Converted 'data\edgar_documents\AXP\4_2024-02-14' --> 'data\processed_data\AXP\4_2024-02-14.md'


2025-11-14 15:40:22,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,183 - INFO - Going to convert document batch...
2025-11-14 15:40:22,185 - INFO - Processing document 4_2024-02-22
2025-11-14 15:40:22,231 - INFO - Finished converting document 4_2024-02-22 in 0.09 sec.
2025-11-14 15:40:22,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,333 - INFO - Going to convert document batch...
2025-11-14 15:40:22,335 - INFO - Processing document 4_2024-03-04
2025-11-14 15:40:22,398 - INFO - Finished converting document 4_2024-03-04 in 0.11 sec.
2025-11-14 15:40:22,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,483 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\4_2024-02-22' --> 'data\processed_data\AXP\4_2024-02-22.md'
Converted 'data\edgar_documents\AXP\4_2024-03-04' --> 'data\processed_data\AXP\4_2024-03-04.md'


2025-11-14 15:40:22,484 - INFO - Processing document 4_2024-03-11
2025-11-14 15:40:22,542 - INFO - Finished converting document 4_2024-03-11 in 0.11 sec.
2025-11-14 15:40:22,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,612 - INFO - Going to convert document batch...
2025-11-14 15:40:22,614 - INFO - Processing document 4_2024-04-02
2025-11-14 15:40:22,652 - INFO - Finished converting document 4_2024-04-02 in 0.08 sec.
2025-11-14 15:40:22,723 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:22,724 - ERROR - Input document 4_2024-04-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\AXP\4_2024-03-11' --> 'data\processed_data\AXP\4_2024-03-11.md'
Converted 'data\edgar_documents\AXP\4_2024-04-02' --> 'data\processed_data\AXP\4_2024-04-02.md'
Error processing data\edgar_documents\AXP\4_2024-04-23: File format not allowed: data\edgar_documents\AXP\4_2024-04-23


2025-11-14 15:40:22,769 - INFO - Going to convert document batch...
2025-11-14 15:40:22,771 - INFO - Processing document 4_2024-04-25
2025-11-14 15:40:22,818 - INFO - Finished converting document 4_2024-04-25 in 0.09 sec.
2025-11-14 15:40:22,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,893 - INFO - Going to convert document batch...
2025-11-14 15:40:22,894 - INFO - Processing document 4_2024-05-02
2025-11-14 15:40:22,952 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 15:40:23,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-04-25' --> 'data\processed_data\AXP\4_2024-04-25.md'
Converted 'data\edgar_documents\AXP\4_2024-05-02' --> 'data\processed_data\AXP\4_2024-05-02.md'


2025-11-14 15:40:23,061 - INFO - Going to convert document batch...
2025-11-14 15:40:23,063 - INFO - Processing document 4_2024-05-06
2025-11-14 15:40:23,124 - INFO - Finished converting document 4_2024-05-06 in 0.11 sec.
2025-11-14 15:40:23,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,200 - INFO - Going to convert document batch...
2025-11-14 15:40:23,202 - INFO - Processing document 4_2024-05-07
2025-11-14 15:40:23,245 - INFO - Finished converting document 4_2024-05-07 in 0.08 sec.
2025-11-14 15:40:23,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,318 - INFO - Going to convert document batch...
2025-11-14 15:40:23,320 - INFO - Processing document 4_2024-05-08


Converted 'data\edgar_documents\AXP\4_2024-05-06' --> 'data\processed_data\AXP\4_2024-05-06.md'
Converted 'data\edgar_documents\AXP\4_2024-05-07' --> 'data\processed_data\AXP\4_2024-05-07.md'


2025-11-14 15:40:23,369 - INFO - Finished converting document 4_2024-05-08 in 0.08 sec.
2025-11-14 15:40:23,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,514 - INFO - Going to convert document batch...
2025-11-14 15:40:23,517 - INFO - Processing document 4_2024-05-13
2025-11-14 15:40:23,610 - INFO - Finished converting document 4_2024-05-13 in 0.19 sec.


Converted 'data\edgar_documents\AXP\4_2024-05-08' --> 'data\processed_data\AXP\4_2024-05-08.md'


2025-11-14 15:40:23,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,805 - INFO - Going to convert document batch...
2025-11-14 15:40:23,807 - INFO - Processing document 4_2024-05-21
2025-11-14 15:40:23,860 - INFO - Finished converting document 4_2024-05-21 in 0.20 sec.


Converted 'data\edgar_documents\AXP\4_2024-05-13' --> 'data\processed_data\AXP\4_2024-05-13.md'


2025-11-14 15:40:23,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,984 - INFO - Going to convert document batch...
2025-11-14 15:40:23,985 - INFO - Processing document 4_2024-05-23
2025-11-14 15:40:24,032 - INFO - Finished converting document 4_2024-05-23 in 0.12 sec.
2025-11-14 15:40:24,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-05-21' --> 'data\processed_data\AXP\4_2024-05-21.md'
Converted 'data\edgar_documents\AXP\4_2024-05-23' --> 'data\processed_data\AXP\4_2024-05-23.md'


2025-11-14 15:40:24,122 - INFO - Going to convert document batch...
2025-11-14 15:40:24,123 - INFO - Processing document 4_2024-06-17
2025-11-14 15:40:24,161 - INFO - Finished converting document 4_2024-06-17 in 0.06 sec.
2025-11-14 15:40:24,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,231 - INFO - Going to convert document batch...
2025-11-14 15:40:24,232 - INFO - Processing document 4_2024-07-02
2025-11-14 15:40:24,272 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 15:40:24,376 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:24,379 - ERROR - Input document 4_2024-07-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\AXP\4_2024-06-17' --> 'data\processed_data\AXP\4_2024-06-17.md'
Converted 'data\edgar_documents\AXP\4_2024-07-02' --> 'data\processed_data\AXP\4_2024-07-02.md'


2025-11-14 15:40:24,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,430 - INFO - Going to convert document batch...
2025-11-14 15:40:24,433 - INFO - Processing document 4_2024-10-02
2025-11-14 15:40:24,487 - INFO - Finished converting document 4_2024-10-02 in 0.09 sec.


Error processing data\edgar_documents\AXP\4_2024-07-23: File format not allowed: data\edgar_documents\AXP\4_2024-07-23
Converted 'data\edgar_documents\AXP\4_2024-10-02' --> 'data\processed_data\AXP\4_2024-10-02.md'


2025-11-14 15:40:24,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,650 - INFO - Going to convert document batch...
2025-11-14 15:40:24,651 - INFO - Processing document 4_2024-10-24
2025-11-14 15:40:24,725 - INFO - Finished converting document 4_2024-10-24 in 0.17 sec.
2025-11-14 15:40:24,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,825 - INFO - Going to convert document batch...
2025-11-14 15:40:24,827 - INFO - Processing document 4_2024-10-31
2025-11-14 15:40:24,875 - INFO - Finished converting document 4_2024-10-31 in 0.11 sec.


Converted 'data\edgar_documents\AXP\4_2024-10-24' --> 'data\processed_data\AXP\4_2024-10-24.md'
Converted 'data\edgar_documents\AXP\4_2024-10-31' --> 'data\processed_data\AXP\4_2024-10-31.md'


2025-11-14 15:40:24,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,991 - INFO - Going to convert document batch...
2025-11-14 15:40:24,993 - INFO - Processing document 4_2024-11-08
2025-11-14 15:40:25,039 - INFO - Finished converting document 4_2024-11-08 in 0.09 sec.
2025-11-14 15:40:25,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,136 - INFO - Going to convert document batch...
2025-11-14 15:40:25,138 - INFO - Processing document 4_2024-11-12
2025-11-14 15:40:25,210 - INFO - Finished converting document 4_2024-11-12 in 0.12 sec.
2025-11-14 15:40:25,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-11-08' --> 'data\processed_data\AXP\4_2024-11-08.md'
Converted 'data\edgar_documents\AXP\4_2024-11-12' --> 'data\processed_data\AXP\4_2024-11-12.md'


2025-11-14 15:40:25,295 - INFO - Going to convert document batch...
2025-11-14 15:40:25,298 - INFO - Processing document 4_2024-11-25
2025-11-14 15:40:25,337 - INFO - Finished converting document 4_2024-11-25 in 0.06 sec.
2025-11-14 15:40:25,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,413 - INFO - Going to convert document batch...
2025-11-14 15:40:25,414 - INFO - Processing document 4_2024-12-02
2025-11-14 15:40:25,458 - INFO - Finished converting document 4_2024-12-02 in 0.08 sec.
2025-11-14 15:40:25,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-11-25' --> 'data\processed_data\AXP\4_2024-11-25.md'
Converted 'data\edgar_documents\AXP\4_2024-12-02' --> 'data\processed_data\AXP\4_2024-12-02.md'


2025-11-14 15:40:25,603 - INFO - Going to convert document batch...
2025-11-14 15:40:25,609 - INFO - Processing document 4_2025-01-03
2025-11-14 15:40:25,672 - INFO - Finished converting document 4_2025-01-03 in 0.14 sec.
2025-11-14 15:40:25,738 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:25,739 - ERROR - Input document 4_2025-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:25,740 - INFO - Going to convert document batch...
2025-11-14 15:40:25,763 - IN

Converted 'data\edgar_documents\AXP\4_2025-01-03' --> 'data\processed_data\AXP\4_2025-01-03.md'
Error processing data\edgar_documents\AXP\4_2025-01-29: File format not allowed: data\edgar_documents\AXP\4_2025-01-29


2025-11-14 15:40:25,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,999 - INFO - Going to convert document batch...
2025-11-14 15:40:26,002 - INFO - Processing document 4_2025-02-06
2025-11-14 15:40:26,056 - INFO - Finished converting document 4_2025-02-06 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-01-30' --> 'data\processed_data\AXP\4_2025-01-30.md'


2025-11-14 15:40:26,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,186 - INFO - Going to convert document batch...
2025-11-14 15:40:26,187 - INFO - Processing document 4_2025-02-10
2025-11-14 15:40:26,235 - INFO - Finished converting document 4_2025-02-10 in 0.11 sec.
2025-11-14 15:40:26,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-02-06' --> 'data\processed_data\AXP\4_2025-02-06.md'
Converted 'data\edgar_documents\AXP\4_2025-02-10' --> 'data\processed_data\AXP\4_2025-02-10.md'


2025-11-14 15:40:26,328 - INFO - Going to convert document batch...
2025-11-14 15:40:26,331 - INFO - Processing document 4_2025-02-13
2025-11-14 15:40:26,378 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 15:40:26,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,485 - INFO - Going to convert document batch...
2025-11-14 15:40:26,487 - INFO - Processing document 4_2025-02-28
2025-11-14 15:40:26,552 - INFO - Finished converting document 4_2025-02-28 in 0.12 sec.
2025-11-14 15:40:26,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-02-13' --> 'data\processed_data\AXP\4_2025-02-13.md'
Converted 'data\edgar_documents\AXP\4_2025-02-28' --> 'data\processed_data\AXP\4_2025-02-28.md'


2025-11-14 15:40:26,632 - INFO - Going to convert document batch...
2025-11-14 15:40:26,633 - INFO - Processing document 4_2025-03-06
2025-11-14 15:40:26,693 - INFO - Finished converting document 4_2025-03-06 in 0.09 sec.
2025-11-14 15:40:26,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,813 - INFO - Going to convert document batch...
2025-11-14 15:40:26,814 - INFO - Processing document 4_2025-03-11
2025-11-14 15:40:26,882 - INFO - Finished converting document 4_2025-03-11 in 0.09 sec.
2025-11-14 15:40:26,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-03-06' --> 'data\processed_data\AXP\4_2025-03-06.md'
Converted 'data\edgar_documents\AXP\4_2025-03-11' --> 'data\processed_data\AXP\4_2025-03-11.md'


2025-11-14 15:40:26,993 - INFO - Going to convert document batch...
2025-11-14 15:40:26,995 - INFO - Processing document 4_2025-04-02
2025-11-14 15:40:27,041 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.
2025-11-14 15:40:27,109 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,111 - ERROR - Input document 4_2025-04-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,112 - INFO - Going to convert document batch...
2025-11-14 15:40:27,128 - IN

Converted 'data\edgar_documents\AXP\4_2025-04-02' --> 'data\processed_data\AXP\4_2025-04-02.md'
Error processing data\edgar_documents\AXP\4_2025-04-22: File format not allowed: data\edgar_documents\AXP\4_2025-04-22
Converted 'data\edgar_documents\AXP\4_2025-04-30' --> 'data\processed_data\AXP\4_2025-04-30.md'


2025-11-14 15:40:27,265 - INFO - Going to convert document batch...
2025-11-14 15:40:27,268 - INFO - Processing document 4_2025-05-01
2025-11-14 15:40:27,315 - INFO - Finished converting document 4_2025-05-01 in 0.08 sec.
2025-11-14 15:40:27,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:27,409 - INFO - Going to convert document batch...
2025-11-14 15:40:27,410 - INFO - Processing document 4_2025-05-07
2025-11-14 15:40:27,457 - INFO - Finished converting document 4_2025-05-07 in 0.09 sec.
2025-11-14 15:40:27,554 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AXP\4_2025-05-01' --> 'data\processed_data\AXP\4_2025-05-01.md'
Converted 'data\edgar_documents\AXP\4_2025-05-07' --> 'data\processed_data\AXP\4_2025-05-07.md'


2025-11-14 15:40:27,555 - ERROR - Input document 4_2025-05-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,558 - INFO - Going to convert document batch...
2025-11-14 15:40:27,590 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,591 - ERROR - Input document 4_2025-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AXP\4_2025-05-13: File format not allowed: data\edgar_documents\AXP\4_2025-05-13
Error processing data\edgar_documents\AXP\4_2025-05-14: File format not allowed: data\edgar_documents\AXP\4_2025-05-14
Converted 'data\edgar_documents\AXP\4_2025-05-21' --> 'data\processed_data\AXP\4_2025-05-21.md'


2025-11-14 15:40:27,862 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,863 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,866 - INFO - Going to convert document batch...
2025-11-14 15:40:27,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:27,923 - INFO - Going to convert document batch...
2025-11-14 15:40:27,924 - INFO - Processing document 4_2025-07-31
2025-11-14 15:40:27,985 - INFO - Fin

Converted 'data\edgar_documents\AXP\4_2025-07-02' --> 'data\processed_data\AXP\4_2025-07-02.md'
Error processing data\edgar_documents\AXP\4_2025-07-22: File format not allowed: data\edgar_documents\AXP\4_2025-07-22


2025-11-14 15:40:28,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,129 - INFO - Going to convert document batch...
2025-11-14 15:40:28,133 - INFO - Processing document 4_2025-08-07
2025-11-14 15:40:28,220 - INFO - Finished converting document 4_2025-08-07 in 0.16 sec.


Converted 'data\edgar_documents\AXP\4_2025-07-31' --> 'data\processed_data\AXP\4_2025-07-31.md'


2025-11-14 15:40:28,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,346 - INFO - Going to convert document batch...
2025-11-14 15:40:28,347 - INFO - Processing document 4_2025-09-04
2025-11-14 15:40:28,423 - INFO - Finished converting document 4_2025-09-04 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-08-07' --> 'data\processed_data\AXP\4_2025-08-07.md'
Converted 'data\edgar_documents\AXP\4_2025-09-04' --> 'data\processed_data\AXP\4_2025-09-04.md'


2025-11-14 15:40:28,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,556 - INFO - Going to convert document batch...
2025-11-14 15:40:28,558 - INFO - Processing document 4_2025-09-05
2025-11-14 15:40:28,714 - INFO - Finished converting document 4_2025-09-05 in 0.22 sec.
2025-11-14 15:40:28,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,832 - INFO - Going to convert document batch...
2025-11-14 15:40:28,833 - INFO - Processing document 4_2025-09-08
2025-11-14 15:40:28,902 - INFO - Finished converting document 4_2025-09-08 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-09-05' --> 'data\processed_data\AXP\4_2025-09-05.md'
Converted 'data\edgar_documents\AXP\4_2025-09-08' --> 'data\processed_data\AXP\4_2025-09-08.md'


2025-11-14 15:40:28,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,009 - INFO - Going to convert document batch...
2025-11-14 15:40:29,011 - INFO - Processing document 4_2025-10-02
2025-11-14 15:40:29,057 - INFO - Finished converting document 4_2025-10-02 in 0.11 sec.
2025-11-14 15:40:29,163 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:29,164 - ERROR - Input document 4_2025-10-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40

Converted 'data\edgar_documents\AXP\4_2025-10-02' --> 'data\processed_data\AXP\4_2025-10-02.md'
Error processing data\edgar_documents\AXP\4_2025-10-21: File format not allowed: data\edgar_documents\AXP\4_2025-10-21


2025-11-14 15:40:29,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,337 - INFO - Going to convert document batch...
2025-11-14 15:40:29,339 - INFO - Processing document 4_2025-10-24
2025-11-14 15:40:29,393 - INFO - Finished converting document 4_2025-10-24 in 0.09 sec.
2025-11-14 15:40:29,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-10-23' --> 'data\processed_data\AXP\4_2025-10-23.md'
Converted 'data\edgar_documents\AXP\4_2025-10-24' --> 'data\processed_data\AXP\4_2025-10-24.md'


2025-11-14 15:40:29,505 - INFO - Going to convert document batch...
2025-11-14 15:40:29,507 - INFO - Processing document 4_2025-11-04
2025-11-14 15:40:29,560 - INFO - Finished converting document 4_2025-11-04 in 0.11 sec.
2025-11-14 15:40:29,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,698 - INFO - Going to convert document batch...
2025-11-14 15:40:29,700 - INFO - Processing document 8-K_2023-01-17
2025-11-14 15:40:29,782 - INFO - Finished converting document 8-K_2023-01-17 in 0.17 sec.


Converted 'data\edgar_documents\AXP\4_2025-11-04' --> 'data\processed_data\AXP\4_2025-11-04.md'
Converted 'data\edgar_documents\AXP\8-K_2023-01-17' --> 'data\processed_data\AXP\8-K_2023-01-17.md'


2025-11-14 15:40:29,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,882 - INFO - Going to convert document batch...
2025-11-14 15:40:29,883 - INFO - Processing document 8-K_2023-01-27
2025-11-14 15:40:29,924 - INFO - Finished converting document 8-K_2023-01-27 in 0.11 sec.
2025-11-14 15:40:29,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,006 - INFO - Going to convert document batch...
2025-11-14 15:40:30,009 - INFO - Processing document 8-K_2023-02-15
2025-11-14 15:40:30,088 - INFO - Finished converting document 8-K_2023-02-15 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-01-27' --> 'data\processed_data\AXP\8-K_2023-01-27.md'
Converted 'data\edgar_documents\AXP\8-K_2023-02-15' --> 'data\processed_data\AXP\8-K_2023-02-15.md'


2025-11-14 15:40:30,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,190 - INFO - Going to convert document batch...
2025-11-14 15:40:30,192 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:40:30,236 - INFO - Finished converting document 8-K_2023-02-16 in 0.11 sec.
2025-11-14 15:40:30,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,303 - INFO - Going to convert document batch...
2025-11-14 15:40:30,304 - INFO - Processing document 8-K_2023-03-08
2025-11-14 15:40:30,339 - INFO - Finished converting document 8-K_2023-03-08 in 0.09 sec.
2025-11-14 15:40:30,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,434 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\8-K_2023-02-16' --> 'data\processed_data\AXP\8-K_2023-02-16.md'
Converted 'data\edgar_documents\AXP\8-K_2023-03-08' --> 'data\processed_data\AXP\8-K_2023-03-08.md'


2025-11-14 15:40:30,436 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:40:30,527 - INFO - Finished converting document 8-K_2023-03-15 in 0.17 sec.
2025-11-14 15:40:30,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,639 - INFO - Going to convert document batch...
2025-11-14 15:40:30,640 - INFO - Processing document 8-K_2023-04-17
2025-11-14 15:40:30,716 - INFO - Finished converting document 8-K_2023-04-17 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-03-15' --> 'data\processed_data\AXP\8-K_2023-03-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-04-17' --> 'data\processed_data\AXP\8-K_2023-04-17.md'


2025-11-14 15:40:30,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,808 - INFO - Going to convert document batch...
2025-11-14 15:40:30,810 - INFO - Processing document 8-K_2023-04-20
2025-11-14 15:40:30,845 - INFO - Finished converting document 8-K_2023-04-20 in 0.09 sec.
2025-11-14 15:40:30,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,913 - INFO - Going to convert document batch...
2025-11-14 15:40:30,914 - INFO - Processing document 8-K_2023-05-01
2025-11-14 15:40:30,955 - INFO - Finished converting document 8-K_2023-05-01 in 0.09 sec.
2025-11-14 15:40:30,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:31,050 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\8-K_2023-04-20' --> 'data\processed_data\AXP\8-K_2023-04-20.md'
Converted 'data\edgar_documents\AXP\8-K_2023-05-01' --> 'data\processed_data\AXP\8-K_2023-05-01.md'


2025-11-14 15:40:31,051 - INFO - Processing document 8-K_2023-05-05
2025-11-14 15:40:31,166 - INFO - Finished converting document 8-K_2023-05-05 in 0.20 sec.
2025-11-14 15:40:31,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:31,292 - INFO - Going to convert document batch...
2025-11-14 15:40:31,293 - INFO - Processing document 8-K_2023-05-15
2025-11-14 15:40:31,367 - INFO - Finished converting document 8-K_2023-05-15 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-05-05' --> 'data\processed_data\AXP\8-K_2023-05-05.md'


2025-11-14 15:40:31,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-05-15' --> 'data\processed_data\AXP\8-K_2023-05-15.md'


2025-11-14 15:40:32,685 - INFO - Going to convert document batch...
2025-11-14 15:40:32,686 - INFO - Processing document 8-K_2023-06-15
2025-11-14 15:40:32,755 - INFO - Finished converting document 8-K_2023-06-15 in 1.34 sec.
2025-11-14 15:40:32,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:32,826 - INFO - Going to convert document batch...
2025-11-14 15:40:32,828 - INFO - Processing document 8-K_2023-06-27
2025-11-14 15:40:32,860 - INFO - Finished converting document 8-K_2023-06-27 in 0.08 sec.
2025-11-14 15:40:32,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-06-15' --> 'data\processed_data\AXP\8-K_2023-06-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-06-27' --> 'data\processed_data\AXP\8-K_2023-06-27.md'


2025-11-14 15:40:32,982 - INFO - Going to convert document batch...
2025-11-14 15:40:32,983 - INFO - Processing document 8-K_2023-07-17
2025-11-14 15:40:33,067 - INFO - Finished converting document 8-K_2023-07-17 in 0.19 sec.
2025-11-14 15:40:33,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,147 - INFO - Going to convert document batch...
2025-11-14 15:40:33,148 - INFO - Processing document 8-K_2023-07-21
2025-11-14 15:40:33,177 - INFO - Finished converting document 8-K_2023-07-21 in 0.06 sec.
2025-11-14 15:40:33,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,258 - INFO - Going to convert document batch...
2025-11-14 15:40:33,260 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:40:33,320 - INFO - Finished converting document 8-K_2023-07-28 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-07-17' --> 'data\processed_data\AXP\8-K_2023-07-17.md'
Converted 'data\edgar_documents\AXP\8-K_2023-07-21' --> 'data\processed_data\AXP\8-K_2023-07-21.md'


2025-11-14 15:40:33,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,443 - INFO - Going to convert document batch...
2025-11-14 15:40:33,445 - INFO - Processing document 8-K_2023-08-15
2025-11-14 15:40:33,530 - INFO - Finished converting document 8-K_2023-08-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-07-28' --> 'data\processed_data\AXP\8-K_2023-07-28.md'


2025-11-14 15:40:33,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,633 - INFO - Going to convert document batch...
2025-11-14 15:40:33,633 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:40:33,699 - INFO - Finished converting document 8-K_2023-09-15 in 0.14 sec.
2025-11-14 15:40:33,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-08-15' --> 'data\processed_data\AXP\8-K_2023-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-09-15' --> 'data\processed_data\AXP\8-K_2023-09-15.md'


2025-11-14 15:40:33,793 - INFO - Going to convert document batch...
2025-11-14 15:40:33,795 - INFO - Processing document 8-K_2023-10-16
2025-11-14 15:40:33,866 - INFO - Finished converting document 8-K_2023-10-16 in 0.14 sec.
2025-11-14 15:40:33,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,981 - INFO - Going to convert document batch...
2025-11-14 15:40:33,983 - INFO - Processing document 8-K_2023-10-20
2025-11-14 15:40:34,043 - INFO - Finished converting document 8-K_2023-10-20 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-10-16' --> 'data\processed_data\AXP\8-K_2023-10-16.md'
Converted 'data\edgar_documents\AXP\8-K_2023-10-20' --> 'data\processed_data\AXP\8-K_2023-10-20.md'


2025-11-14 15:40:34,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,149 - INFO - Going to convert document batch...
2025-11-14 15:40:34,150 - INFO - Processing document 8-K_2023-10-30
2025-11-14 15:40:34,206 - INFO - Finished converting document 8-K_2023-10-30 in 0.14 sec.
2025-11-14 15:40:34,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,327 - INFO - Going to convert document batch...
2025-11-14 15:40:34,331 - INFO - Processing document 8-K_2023-11-15
2025-11-14 15:40:34,420 - INFO - Finished converting document 8-K_2023-11-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-10-30' --> 'data\processed_data\AXP\8-K_2023-10-30.md'


2025-11-14 15:40:34,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,552 - INFO - Going to convert document batch...
2025-11-14 15:40:34,553 - INFO - Processing document 8-K_2023-12-15


Converted 'data\edgar_documents\AXP\8-K_2023-11-15' --> 'data\processed_data\AXP\8-K_2023-11-15.md'


2025-11-14 15:40:34,665 - INFO - Finished converting document 8-K_2023-12-15 in 0.19 sec.
2025-11-14 15:40:34,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,775 - INFO - Going to convert document batch...
2025-11-14 15:40:34,777 - INFO - Processing document 8-K_2024-01-16
2025-11-14 15:40:34,843 - INFO - Finished converting document 8-K_2024-01-16 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-12-15' --> 'data\processed_data\AXP\8-K_2023-12-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-01-16' --> 'data\processed_data\AXP\8-K_2024-01-16.md'


2025-11-14 15:40:34,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,952 - INFO - Going to convert document batch...
2025-11-14 15:40:34,954 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:40:35,010 - INFO - Finished converting document 8-K_2024-01-26 in 0.16 sec.
2025-11-14 15:40:35,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,100 - INFO - Going to convert document batch...
2025-11-14 15:40:35,101 - INFO - Processing document 8-K_2024-02-15
2025-11-14 15:40:35,182 - INFO - Finished converting document 8-K_2024-02-15 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-01-26' --> 'data\processed_data\AXP\8-K_2024-01-26.md'


2025-11-14 15:40:35,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,295 - INFO - Going to convert document batch...
2025-11-14 15:40:35,297 - INFO - Processing document 8-K_2024-02-16
2025-11-14 15:40:35,340 - INFO - Finished converting document 8-K_2024-02-16 in 0.11 sec.
2025-11-14 15:40:35,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,403 - INFO - Going to convert document batch...
2025-11-14 15:40:35,404 - INFO - Processing document 8-K_2024-03-07
2025-11-14 15:40:35,435 - INFO - Finished converting document 8-K_2024-03-07 in 0.08 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-02-15' --> 'data\processed_data\AXP\8-K_2024-02-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-02-16' --> 'data\processed_data\AXP\8-K_2024-02-16.md'


2025-11-14 15:40:35,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,502 - INFO - Going to convert document batch...
2025-11-14 15:40:35,502 - INFO - Processing document 8-K_2024-03-15
2025-11-14 15:40:35,563 - INFO - Finished converting document 8-K_2024-03-15 in 0.11 sec.
2025-11-14 15:40:35,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2024-03-07' --> 'data\processed_data\AXP\8-K_2024-03-07.md'
Converted 'data\edgar_documents\AXP\8-K_2024-03-15' --> 'data\processed_data\AXP\8-K_2024-03-15.md'


2025-11-14 15:40:35,699 - INFO - Going to convert document batch...
2025-11-14 15:40:35,701 - INFO - Processing document 8-K_2024-04-15
2025-11-14 15:40:35,852 - INFO - Finished converting document 8-K_2024-04-15 in 0.24 sec.
2025-11-14 15:40:35,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,962 - INFO - Going to convert document batch...
2025-11-14 15:40:35,964 - INFO - Processing document 8-K_2024-04-19
2025-11-14 15:40:36,049 - INFO - Finished converting document 8-K_2024-04-19 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-04-15' --> 'data\processed_data\AXP\8-K_2024-04-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-04-19' --> 'data\processed_data\AXP\8-K_2024-04-19.md'


2025-11-14 15:40:36,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,174 - INFO - Going to convert document batch...
2025-11-14 15:40:36,176 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:40:36,244 - INFO - Finished converting document 8-K_2024-04-25 in 0.12 sec.
2025-11-14 15:40:36,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,349 - INFO - Going to convert document batch...
2025-11-14 15:40:36,349 - INFO - Processing document 8-K_2024-05-08


Converted 'data\edgar_documents\AXP\8-K_2024-04-25' --> 'data\processed_data\AXP\8-K_2024-04-25.md'


2025-11-14 15:40:36,574 - INFO - Finished converting document 8-K_2024-05-08 in 0.33 sec.
2025-11-14 15:40:36,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,739 - INFO - Going to convert document batch...
2025-11-14 15:40:36,741 - INFO - Processing document 8-K_2024-05-15
2025-11-14 15:40:36,817 - INFO - Finished converting document 8-K_2024-05-15 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-05-08' --> 'data\processed_data\AXP\8-K_2024-05-08.md'
Converted 'data\edgar_documents\AXP\8-K_2024-05-15' --> 'data\processed_data\AXP\8-K_2024-05-15.md'


2025-11-14 15:40:36,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,937 - INFO - Going to convert document batch...
2025-11-14 15:40:36,939 - INFO - Processing document 8-K_2024-06-17
2025-11-14 15:40:37,021 - INFO - Finished converting document 8-K_2024-06-17 in 0.17 sec.
2025-11-14 15:40:37,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,179 - INFO - Going to convert document batch...
2025-11-14 15:40:37,181 - INFO - Processing document 8-K_2024-07-15


Converted 'data\edgar_documents\AXP\8-K_2024-06-17' --> 'data\processed_data\AXP\8-K_2024-06-17.md'


2025-11-14 15:40:37,299 - INFO - Finished converting document 8-K_2024-07-15 in 0.22 sec.
2025-11-14 15:40:37,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,413 - INFO - Going to convert document batch...
2025-11-14 15:40:37,414 - INFO - Processing document 8-K_2024-07-19
2025-11-14 15:40:37,460 - INFO - Finished converting document 8-K_2024-07-19 in 0.11 sec.
2025-11-14 15:40:37,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2024-07-15' --> 'data\processed_data\AXP\8-K_2024-07-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-07-19' --> 'data\processed_data\AXP\8-K_2024-07-19.md'


2025-11-14 15:40:37,545 - INFO - Going to convert document batch...
2025-11-14 15:40:37,549 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:40:37,627 - INFO - Finished converting document 8-K_2024-07-26 in 0.16 sec.
2025-11-14 15:40:37,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,729 - INFO - Going to convert document batch...
2025-11-14 15:40:37,731 - INFO - Processing document 8-K_2024-08-15
2025-11-14 15:40:37,839 - INFO - Finished converting document 8-K_2024-08-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-07-26' --> 'data\processed_data\AXP\8-K_2024-07-26.md'


2025-11-14 15:40:37,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,967 - INFO - Going to convert document batch...
2025-11-14 15:40:37,968 - INFO - Processing document 8-K_2024-09-16
2025-11-14 15:40:38,042 - INFO - Finished converting document 8-K_2024-09-16 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-08-15' --> 'data\processed_data\AXP\8-K_2024-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-09-16' --> 'data\processed_data\AXP\8-K_2024-09-16.md'


2025-11-14 15:40:38,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,133 - INFO - Going to convert document batch...
2025-11-14 15:40:38,134 - INFO - Processing document 8-K_2024-09-27
2025-11-14 15:40:38,171 - INFO - Finished converting document 8-K_2024-09-27 in 0.09 sec.
2025-11-14 15:40:38,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,241 - INFO - Going to convert document batch...
2025-11-14 15:40:38,244 - INFO - Processing document 8-K_2024-10-15
2025-11-14 15:40:38,319 - INFO - Finished converting document 8-K_2024-10-15 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-09-27' --> 'data\processed_data\AXP\8-K_2024-09-27.md'
Converted 'data\edgar_documents\AXP\8-K_2024-10-15' --> 'data\processed_data\AXP\8-K_2024-10-15.md'


2025-11-14 15:40:38,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,422 - INFO - Going to convert document batch...
2025-11-14 15:40:38,424 - INFO - Processing document 8-K_2024-10-18
2025-11-14 15:40:38,470 - INFO - Finished converting document 8-K_2024-10-18 in 0.11 sec.
2025-11-14 15:40:38,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,551 - INFO - Going to convert document batch...
2025-11-14 15:40:38,552 - INFO - Processing document 8-K_2024-11-15


Converted 'data\edgar_documents\AXP\8-K_2024-10-18' --> 'data\processed_data\AXP\8-K_2024-10-18.md'


2025-11-14 15:40:38,697 - INFO - Finished converting document 8-K_2024-11-15 in 0.20 sec.
2025-11-14 15:40:38,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,806 - INFO - Going to convert document batch...
2025-11-14 15:40:38,808 - INFO - Processing document 8-K_2024-12-16
2025-11-14 15:40:38,893 - INFO - Finished converting document 8-K_2024-12-16 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-11-15' --> 'data\processed_data\AXP\8-K_2024-11-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-12-16' --> 'data\processed_data\AXP\8-K_2024-12-16.md'


2025-11-14 15:40:38,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,069 - INFO - Going to convert document batch...
2025-11-14 15:40:39,070 - INFO - Processing document 8-K_2025-01-15
2025-11-14 15:40:39,208 - INFO - Finished converting document 8-K_2025-01-15 in 0.25 sec.
2025-11-14 15:40:39,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,327 - INFO - Going to convert document batch...
2025-11-14 15:40:39,328 - INFO - Processing document 8-K_2025-01-16
2025-11-14 15:40:39,374 - INFO - Finished converting document 8-K_2025-01-16 in 0.09 sec.
2025-11-14 15:40:39,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,453 - INFO - Going to convert document batch...
2025-11-14 15:40:39,454 - INFO - Processing document 8-K_2025-01-24


Converted 'data\edgar_documents\AXP\8-K_2025-01-15' --> 'data\processed_data\AXP\8-K_2025-01-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-01-16' --> 'data\processed_data\AXP\8-K_2025-01-16.md'


2025-11-14 15:40:39,511 - INFO - Finished converting document 8-K_2025-01-24 in 0.12 sec.
2025-11-14 15:40:39,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,577 - INFO - Going to convert document batch...
2025-11-14 15:40:39,578 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:40:39,614 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.
2025-11-14 15:40:39,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,696 - INFO - Going to convert document batch...
2025-11-14 15:40:39,697 - INFO - Processing document 8-K_2025-02-18


Converted 'data\edgar_documents\AXP\8-K_2025-01-24' --> 'data\processed_data\AXP\8-K_2025-01-24.md'
Converted 'data\edgar_documents\AXP\8-K_2025-01-30' --> 'data\processed_data\AXP\8-K_2025-01-30.md'


2025-11-14 15:40:39,837 - INFO - Finished converting document 8-K_2025-02-18 in 0.20 sec.
2025-11-14 15:40:39,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,967 - INFO - Going to convert document batch...
2025-11-14 15:40:39,968 - INFO - Processing document 8-K_2025-03-03
2025-11-14 15:40:40,025 - INFO - Finished converting document 8-K_2025-03-03 in 0.12 sec.
2025-11-14 15:40:40,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-02-18' --> 'data\processed_data\AXP\8-K_2025-02-18.md'
Converted 'data\edgar_documents\AXP\8-K_2025-03-03' --> 'data\processed_data\AXP\8-K_2025-03-03.md'


2025-11-14 15:40:40,157 - INFO - Going to convert document batch...
2025-11-14 15:40:40,159 - INFO - Processing document 8-K_2025-03-17
2025-11-14 15:40:40,227 - INFO - Finished converting document 8-K_2025-03-17 in 0.17 sec.
2025-11-14 15:40:40,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:40,303 - INFO - Going to convert document batch...
2025-11-14 15:40:40,304 - INFO - Processing document 8-K_2025-04-15


Converted 'data\edgar_documents\AXP\8-K_2025-03-17' --> 'data\processed_data\AXP\8-K_2025-03-17.md'


2025-11-14 15:40:40,886 - INFO - Finished converting document 8-K_2025-04-15 in 0.64 sec.
2025-11-14 15:40:40,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,033 - INFO - Going to convert document batch...
2025-11-14 15:40:41,035 - INFO - Processing document 8-K_2025-04-17
2025-11-14 15:40:41,085 - INFO - Finished converting document 8-K_2025-04-17 in 0.11 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-04-15' --> 'data\processed_data\AXP\8-K_2025-04-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-04-17' --> 'data\processed_data\AXP\8-K_2025-04-17.md'


2025-11-14 15:40:41,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,199 - INFO - Going to convert document batch...
2025-11-14 15:40:41,201 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:40:41,267 - INFO - Finished converting document 8-K_2025-04-25 in 0.14 sec.
2025-11-14 15:40:41,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,383 - INFO - Going to convert document batch...
2025-11-14 15:40:41,384 - INFO - Processing document 8-K_2025-05-01


Converted 'data\edgar_documents\AXP\8-K_2025-04-25' --> 'data\processed_data\AXP\8-K_2025-04-25.md'


2025-11-14 15:40:41,526 - INFO - Finished converting document 8-K_2025-05-01 in 0.23 sec.
2025-11-14 15:40:41,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,668 - INFO - Going to convert document batch...
2025-11-14 15:40:41,668 - INFO - Processing document 8-K_2025-05-15
2025-11-14 15:40:41,741 - INFO - Finished converting document 8-K_2025-05-15 in 0.14 sec.
2025-11-14 15:40:41,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-05-01' --> 'data\processed_data\AXP\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AXP\8-K_2025-05-15' --> 'data\processed_data\AXP\8-K_2025-05-15.md'


2025-11-14 15:40:41,811 - INFO - Going to convert document batch...
2025-11-14 15:40:41,812 - INFO - Processing document 8-K_2025-05-20
2025-11-14 15:40:41,844 - INFO - Finished converting document 8-K_2025-05-20 in 0.08 sec.
2025-11-14 15:40:41,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,905 - INFO - Going to convert document batch...
2025-11-14 15:40:41,906 - INFO - Processing document 8-K_2025-06-16
2025-11-14 15:40:41,951 - INFO - Finished converting document 8-K_2025-06-16 in 0.09 sec.
2025-11-14 15:40:42,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-05-20' --> 'data\processed_data\AXP\8-K_2025-05-20.md'
Converted 'data\edgar_documents\AXP\8-K_2025-06-16' --> 'data\processed_data\AXP\8-K_2025-06-16.md'


2025-11-14 15:40:42,089 - INFO - Going to convert document batch...
2025-11-14 15:40:42,093 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:40:42,170 - INFO - Finished converting document 8-K_2025-07-01 in 0.17 sec.
2025-11-14 15:40:42,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,259 - INFO - Going to convert document batch...
2025-11-14 15:40:42,261 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:40:42,382 - INFO - Finished converting document 8-K_2025-07-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-07-01' --> 'data\processed_data\AXP\8-K_2025-07-01.md'


2025-11-14 15:40:42,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,518 - INFO - Going to convert document batch...
2025-11-14 15:40:42,521 - INFO - Processing document 8-K_2025-07-18
2025-11-14 15:40:42,596 - INFO - Finished converting document 8-K_2025-07-18 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-07-15' --> 'data\processed_data\AXP\8-K_2025-07-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-07-18' --> 'data\processed_data\AXP\8-K_2025-07-18.md'


2025-11-14 15:40:42,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,692 - INFO - Going to convert document batch...
2025-11-14 15:40:42,693 - INFO - Processing document 8-K_2025-07-23
2025-11-14 15:40:42,724 - INFO - Finished converting document 8-K_2025-07-23 in 0.08 sec.
2025-11-14 15:40:42,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,784 - INFO - Going to convert document batch...
2025-11-14 15:40:42,786 - INFO - Processing document 8-K_2025-07-25
2025-11-14 15:40:42,826 - INFO - Finished converting document 8-K_2025-07-25 in 0.09 sec.
2025-11-14 15:40:42,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,915 - INFO - Going to convert document batch...
2025-11-14 15:40:42,916 - INFO - Processing document 8-K_2025-08-15


Converted 'data\edgar_documents\AXP\8-K_2025-07-23' --> 'data\processed_data\AXP\8-K_2025-07-23.md'
Converted 'data\edgar_documents\AXP\8-K_2025-07-25' --> 'data\processed_data\AXP\8-K_2025-07-25.md'


2025-11-14 15:40:42,978 - INFO - Finished converting document 8-K_2025-08-15 in 0.12 sec.
2025-11-14 15:40:43,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,059 - INFO - Going to convert document batch...
2025-11-14 15:40:43,060 - INFO - Processing document 8-K_2025-09-15
2025-11-14 15:40:43,133 - INFO - Finished converting document 8-K_2025-09-15 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-08-15' --> 'data\processed_data\AXP\8-K_2025-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-09-15' --> 'data\processed_data\AXP\8-K_2025-09-15.md'


2025-11-14 15:40:43,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,223 - INFO - Going to convert document batch...
2025-11-14 15:40:43,224 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:40:43,259 - INFO - Finished converting document 8-K_2025-09-29 in 0.08 sec.
2025-11-14 15:40:43,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,330 - INFO - Going to convert document batch...
2025-11-14 15:40:43,331 - INFO - Processing document 8-K_2025-10-15
2025-11-14 15:40:43,405 - INFO - Finished converting document 8-K_2025-10-15 in 0.12 sec.
2025-11-14 15:40:43,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-09-29' --> 'data\processed_data\AXP\8-K_2025-09-29.md'
Converted 'data\edgar_documents\AXP\8-K_2025-10-15' --> 'data\processed_data\AXP\8-K_2025-10-15.md'


2025-11-14 15:40:43,499 - INFO - Going to convert document batch...
2025-11-14 15:40:43,500 - INFO - Processing document 8-K_2025-10-17
2025-11-14 15:40:43,538 - INFO - Finished converting document 8-K_2025-10-17 in 0.09 sec.
2025-11-14 15:40:43,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,591 - INFO - Going to convert document batch...
2025-11-14 15:40:43,593 - INFO - Processing document 8-K_2025-10-24
2025-11-14 15:40:43,636 - INFO - Finished converting document 8-K_2025-10-24 in 0.08 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-10-17' --> 'data\processed_data\AXP\8-K_2025-10-17.md'
Converted 'data\edgar_documents\AXP\8-K_2025-10-24' --> 'data\processed_data\AXP\8-K_2025-10-24.md'


2025-11-14 15:40:43,743 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:43,743 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:43,747 - INFO - Going to convert document batch...
2025-11-14 15:40:43,800 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:43,800 - ERROR - Input document DEF-14A_2024-03-15 with format No

Error processing data\edgar_documents\AXP\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\AXP\DEF-14A_2023-03-17
Error processing data\edgar_documents\AXP\DEF-14A_2024-03-15: File format not allowed: data\edgar_documents\AXP\DEF-14A_2024-03-15
Error processing data\edgar_documents\AXP\DEF-14A_2025-03-14: File format not allowed: data\edgar_documents\AXP\DEF-14A_2025-03-14
Processed 149 new files. Errors: 20
Found 106 files to process in data\edgar_documents\BA


2025-11-14 15:40:44,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:46,485 - INFO - Going to convert document batch...
2025-11-14 15:40:46,486 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:40:46,487 - INFO - Processing document 10-K_2023-01-27
2025-11-14 15:40:52,229 - INFO - Finished converting document 10-K_2023-01-27 in 8.36 sec.
2025-11-14 15:40:54,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2023-01-27' --> 'data\processed_data\BA\10-K_2023-01-27.md'


2025-11-14 15:40:56,375 - INFO - Going to convert document batch...
2025-11-14 15:40:56,376 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:41:01,591 - INFO - Finished converting document 10-K_2024-01-31 in 7.66 sec.
2025-11-14 15:41:03,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2024-01-31' --> 'data\processed_data\BA\10-K_2024-01-31.md'


2025-11-14 15:41:07,284 - INFO - Going to convert document batch...
2025-11-14 15:41:07,285 - INFO - Processing document 10-K_2025-02-03
2025-11-14 15:41:13,152 - INFO - Finished converting document 10-K_2025-02-03 in 9.34 sec.
2025-11-14 15:41:15,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2025-02-03' --> 'data\processed_data\BA\10-K_2025-02-03.md'


2025-11-14 15:41:16,334 - INFO - Going to convert document batch...
2025-11-14 15:41:16,336 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 15:41:19,607 - INFO - Finished converting document 10-Q_2023-04-26 in 4.20 sec.
2025-11-14 15:41:20,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-04-26' --> 'data\processed_data\BA\10-Q_2023-04-26.md'


2025-11-14 15:41:22,048 - INFO - Going to convert document batch...
2025-11-14 15:41:22,050 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 15:41:24,595 - INFO - Finished converting document 10-Q_2023-07-26 in 3.84 sec.
2025-11-14 15:41:25,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-07-26' --> 'data\processed_data\BA\10-Q_2023-07-26.md'


2025-11-14 15:41:28,028 - INFO - Going to convert document batch...
2025-11-14 15:41:28,029 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 15:41:30,736 - INFO - Finished converting document 10-Q_2023-10-25 in 4.89 sec.
2025-11-14 15:41:32,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-10-25' --> 'data\processed_data\BA\10-Q_2023-10-25.md'


2025-11-14 15:41:32,947 - INFO - Going to convert document batch...
2025-11-14 15:41:32,949 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 15:41:35,284 - INFO - Finished converting document 10-Q_2024-04-24 in 3.30 sec.
2025-11-14 15:41:36,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-04-24' --> 'data\processed_data\BA\10-Q_2024-04-24.md'


2025-11-14 15:41:38,247 - INFO - Going to convert document batch...
2025-11-14 15:41:38,248 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:41:41,291 - INFO - Finished converting document 10-Q_2024-07-31 in 4.72 sec.
2025-11-14 15:41:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-07-31' --> 'data\processed_data\BA\10-Q_2024-07-31.md'


2025-11-14 15:41:44,651 - INFO - Going to convert document batch...
2025-11-14 15:41:44,653 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 15:41:47,398 - INFO - Finished converting document 10-Q_2024-10-23 in 4.77 sec.
2025-11-14 15:41:49,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-10-23' --> 'data\processed_data\BA\10-Q_2024-10-23.md'


2025-11-14 15:41:50,013 - INFO - Going to convert document batch...
2025-11-14 15:41:50,020 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 15:41:52,518 - INFO - Finished converting document 10-Q_2025-04-23 in 3.56 sec.
2025-11-14 15:41:54,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2025-04-23' --> 'data\processed_data\BA\10-Q_2025-04-23.md'


2025-11-14 15:41:56,332 - INFO - Going to convert document batch...
2025-11-14 15:41:56,334 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:41:59,271 - INFO - Finished converting document 10-Q_2025-07-29 in 4.61 sec.
2025-11-14 15:42:00,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2025-07-29' --> 'data\processed_data\BA\10-Q_2025-07-29.md'


2025-11-14 15:42:02,335 - INFO - Going to convert document batch...
2025-11-14 15:42:02,336 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 15:42:05,391 - INFO - Finished converting document 10-Q_2025-10-29 in 4.80 sec.
2025-11-14 15:42:07,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,062 - INFO - Going to convert document batch...
2025-11-14 15:42:07,064 - INFO - Processing document 4_2023-01-05
2025-11-14 15:42:07,122 - INFO - Finished converting document 4_2023-01-05 in 0.12 sec.


Converted 'data\edgar_documents\BA\10-Q_2025-10-29' --> 'data\processed_data\BA\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\BA\4_2023-01-05' --> 'data\processed_data\BA\4_2023-01-05.md'


2025-11-14 15:42:07,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,279 - INFO - Going to convert document batch...
2025-11-14 15:42:07,281 - INFO - Processing document 4_2023-02-21
2025-11-14 15:42:07,341 - INFO - Finished converting document 4_2023-02-21 in 0.14 sec.
2025-11-14 15:42:07,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,439 - INFO - Going to convert document batch...
2025-11-14 15:42:07,441 - INFO - Processing document 4_2023-02-28
2025-11-14 15:42:07,494 - INFO - Finished converting document 4_2023-02-28 in 0.09 sec.
2025-11-14 15:42:07,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-02-21' --> 'data\processed_data\BA\4_2023-02-21.md'
Converted 'data\edgar_documents\BA\4_2023-02-28' --> 'data\processed_data\BA\4_2023-02-28.md'


2025-11-14 15:42:07,609 - INFO - Going to convert document batch...
2025-11-14 15:42:07,611 - INFO - Processing document 4_2023-04-05
2025-11-14 15:42:07,674 - INFO - Finished converting document 4_2023-04-05 in 0.12 sec.
2025-11-14 15:42:07,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,753 - INFO - Going to convert document batch...
2025-11-14 15:42:07,756 - INFO - Processing document 4_2023-04-18
2025-11-14 15:42:07,810 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:42:07,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-04-05' --> 'data\processed_data\BA\4_2023-04-05.md'
Converted 'data\edgar_documents\BA\4_2023-04-18' --> 'data\processed_data\BA\4_2023-04-18.md'


2025-11-14 15:42:07,954 - INFO - Going to convert document batch...
2025-11-14 15:42:07,956 - INFO - Processing document 4_2023-05-03
2025-11-14 15:42:08,046 - INFO - Finished converting document 4_2023-05-03 in 0.16 sec.
2025-11-14 15:42:08,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,175 - INFO - Going to convert document batch...
2025-11-14 15:42:08,177 - INFO - Processing document 4_2023-05-08
2025-11-14 15:42:08,245 - INFO - Finished converting document 4_2023-05-08 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2023-05-03' --> 'data\processed_data\BA\4_2023-05-03.md'


2025-11-14 15:42:08,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,375 - INFO - Going to convert document batch...
2025-11-14 15:42:08,378 - INFO - Processing document 4_2023-07-06
2025-11-14 15:42:08,457 - INFO - Finished converting document 4_2023-07-06 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2023-05-08' --> 'data\processed_data\BA\4_2023-05-08.md'


2025-11-14 15:42:08,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,596 - INFO - Going to convert document batch...
2025-11-14 15:42:08,598 - INFO - Processing document 4_2023-07-10
2025-11-14 15:42:08,669 - INFO - Finished converting document 4_2023-07-10 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-07-06' --> 'data\processed_data\BA\4_2023-07-06.md'
Converted 'data\edgar_documents\BA\4_2023-07-10' --> 'data\processed_data\BA\4_2023-07-10.md'


2025-11-14 15:42:08,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,033 - INFO - Going to convert document batch...
2025-11-14 15:42:09,035 - INFO - Processing document 4_2023-08-02
2025-11-14 15:42:09,097 - INFO - Finished converting document 4_2023-08-02 in 0.34 sec.
2025-11-14 15:42:09,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,172 - INFO - Going to convert document batch...
2025-11-14 15:42:09,173 - INFO - Processing document 4_2023-08-03
2025-11-14 15:42:09,245 - INFO - Finished converting document 4_2023-08-03 in 0.11 sec.
2025-11-14 15:42:09,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-08-02' --> 'data\processed_data\BA\4_2023-08-02.md'
Converted 'data\edgar_documents\BA\4_2023-08-03' --> 'data\processed_data\BA\4_2023-08-03.md'


2025-11-14 15:42:09,356 - INFO - Going to convert document batch...
2025-11-14 15:42:09,357 - INFO - Processing document 4_2023-10-04
2025-11-14 15:42:09,396 - INFO - Finished converting document 4_2023-10-04 in 0.09 sec.
2025-11-14 15:42:09,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,537 - INFO - Going to convert document batch...
2025-11-14 15:42:09,538 - INFO - Processing document 4_2023-12-05
2025-11-14 15:42:09,582 - INFO - Finished converting document 4_2023-12-05 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-10-04' --> 'data\processed_data\BA\4_2023-10-04.md'
Converted 'data\edgar_documents\BA\4_2023-12-05' --> 'data\processed_data\BA\4_2023-12-05.md'


2025-11-14 15:42:09,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,700 - INFO - Going to convert document batch...
2025-11-14 15:42:09,702 - INFO - Processing document 4_2023-12-18
2025-11-14 15:42:09,760 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:42:09,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,845 - INFO - Going to convert document batch...
2025-11-14 15:42:09,846 - INFO - Processing document 4_2024-01-04
2025-11-14 15:42:09,924 - INFO - Finished converting document 4_2024-01-04 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-12-18' --> 'data\processed_data\BA\4_2023-12-18.md'
Converted 'data\edgar_documents\BA\4_2024-01-04' --> 'data\processed_data\BA\4_2024-01-04.md'


2025-11-14 15:42:10,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,055 - INFO - Going to convert document batch...
2025-11-14 15:42:10,057 - INFO - Processing document 4_2024-01-22
2025-11-14 15:42:10,178 - INFO - Finished converting document 4_2024-01-22 in 0.20 sec.
2025-11-14 15:42:10,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,253 - INFO - Going to convert document batch...
2025-11-14 15:42:10,254 - INFO - Processing document 4_2024-02-21
2025-11-14 15:42:10,285 - INFO - Finished converting document 4_2024-02-21 in 0.06 sec.
2025-11-14 15:42:10,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2024-01-22' --> 'data\processed_data\BA\4_2024-01-22.md'
Converted 'data\edgar_documents\BA\4_2024-02-21' --> 'data\processed_data\BA\4_2024-02-21.md'


2025-11-14 15:42:10,401 - INFO - Going to convert document batch...
2025-11-14 15:42:10,404 - INFO - Processing document 4_2024-02-22
2025-11-14 15:42:10,472 - INFO - Finished converting document 4_2024-02-22 in 0.14 sec.
2025-11-14 15:42:10,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,602 - INFO - Going to convert document batch...
2025-11-14 15:42:10,604 - INFO - Processing document 4_2024-03-01
2025-11-14 15:42:10,685 - INFO - Finished converting document 4_2024-03-01 in 0.16 sec.


Converted 'data\edgar_documents\BA\4_2024-02-22' --> 'data\processed_data\BA\4_2024-02-22.md'


2025-11-14 15:42:10,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,832 - INFO - Going to convert document batch...
2025-11-14 15:42:10,833 - INFO - Processing document 4_2024-03-13
2025-11-14 15:42:10,898 - INFO - Finished converting document 4_2024-03-13 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2024-03-01' --> 'data\processed_data\BA\4_2024-03-01.md'
Converted 'data\edgar_documents\BA\4_2024-03-13' --> 'data\processed_data\BA\4_2024-03-13.md'


2025-11-14 15:42:11,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,047 - INFO - Going to convert document batch...
2025-11-14 15:42:11,048 - INFO - Processing document 4_2024-04-03
2025-11-14 15:42:11,120 - INFO - Finished converting document 4_2024-04-03 in 0.17 sec.
2025-11-14 15:42:11,227 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:11,228 - ERROR - Input document 4_2024-07-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42

Converted 'data\edgar_documents\BA\4_2024-04-03' --> 'data\processed_data\BA\4_2024-04-03.md'
Error processing data\edgar_documents\BA\4_2024-07-01: File format not allowed: data\edgar_documents\BA\4_2024-07-01


2025-11-14 15:42:11,463 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:11,465 - ERROR - Input document 4_2024-07-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:11,467 - INFO - Going to convert document batch...
2025-11-14 15:42:11,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,548 - INFO - Going to convert document batch...
2025-11-14 15:42:11,550 - INFO - Processing document 4_2024-08-09


Converted 'data\edgar_documents\BA\4_2024-07-03' --> 'data\processed_data\BA\4_2024-07-03.md'
Error processing data\edgar_documents\BA\4_2024-07-31: File format not allowed: data\edgar_documents\BA\4_2024-07-31


2025-11-14 15:42:11,613 - INFO - Finished converting document 4_2024-08-09 in 0.14 sec.
2025-11-14 15:42:11,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,736 - INFO - Going to convert document batch...
2025-11-14 15:42:11,738 - INFO - Processing document 4_2024-08-29
2025-11-14 15:42:11,804 - INFO - Finished converting document 4_2024-08-29 in 0.11 sec.


Converted 'data\edgar_documents\BA\4_2024-08-09' --> 'data\processed_data\BA\4_2024-08-09.md'
Converted 'data\edgar_documents\BA\4_2024-08-29' --> 'data\processed_data\BA\4_2024-08-29.md'


2025-11-14 15:42:11,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,951 - INFO - Going to convert document batch...
2025-11-14 15:42:11,954 - INFO - Processing document 4_2024-09-05
2025-11-14 15:42:12,039 - INFO - Finished converting document 4_2024-09-05 in 0.16 sec.
2025-11-14 15:42:12,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:12,170 - INFO - Going to convert document batch...
2025-11-14 15:42:12,172 - INFO - Processing document 4_2024-10-03
2025-11-14 15:42:12,237 - INFO - Finished converting document 4_2024-10-03 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2024-09-05' --> 'data\processed_data\BA\4_2024-09-05.md'
Converted 'data\edgar_documents\BA\4_2024-10-03' --> 'data\processed_data\BA\4_2024-10-03.md'


2025-11-14 15:42:12,519 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,522 - ERROR - Input document 4_2024-10-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:12,526 - INFO - Going to convert document batch...
2025-11-14 15:42:12,556 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,559 - ERROR - Input document 4_2024-10-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\BA\4_2024-10-28: File format not allowed: data\edgar_documents\BA\4_2024-10-28
Error processing data\edgar_documents\BA\4_2024-10-29: File format not allowed: data\edgar_documents\BA\4_2024-10-29
Error processing data\edgar_documents\BA\4_2024-11-18: File format not allowed: data\edgar_documents\BA\4_2024-11-18


2025-11-14 15:42:12,877 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,879 - ERROR - Input document 4_2024-12-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:12,884 - INFO - Going to convert document batch...
2025-11-14 15:42:12,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:12,955 - INFO - Going to convert document batch...
2025-11-14 15:42:12,957 - INFO - Processing document 4_2025-01-03


Converted 'data\edgar_documents\BA\4_2024-12-04' --> 'data\processed_data\BA\4_2024-12-04.md'
Error processing data\edgar_documents\BA\4_2024-12-20: File format not allowed: data\edgar_documents\BA\4_2024-12-20


2025-11-14 15:42:13,119 - INFO - Finished converting document 4_2025-01-03 in 0.23 sec.
2025-11-14 15:42:13,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,198 - INFO - Going to convert document batch...
2025-11-14 15:42:13,199 - INFO - Processing document 4_2025-01-06
2025-11-14 15:42:13,239 - INFO - Finished converting document 4_2025-01-06 in 0.06 sec.
2025-11-14 15:42:13,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-01-03' --> 'data\processed_data\BA\4_2025-01-03.md'
Converted 'data\edgar_documents\BA\4_2025-01-06' --> 'data\processed_data\BA\4_2025-01-06.md'


2025-11-14 15:42:13,364 - INFO - Going to convert document batch...
2025-11-14 15:42:13,366 - INFO - Processing document 4_2025-01-17
2025-11-14 15:42:13,410 - INFO - Finished converting document 4_2025-01-17 in 0.12 sec.
2025-11-14 15:42:13,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,525 - INFO - Going to convert document batch...
2025-11-14 15:42:13,526 - INFO - Processing document 4_2025-02-20
2025-11-14 15:42:13,561 - INFO - Finished converting document 4_2025-02-20 in 0.11 sec.


Converted 'data\edgar_documents\BA\4_2025-01-17' --> 'data\processed_data\BA\4_2025-01-17.md'
Converted 'data\edgar_documents\BA\4_2025-02-20' --> 'data\processed_data\BA\4_2025-02-20.md'


2025-11-14 15:42:13,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,669 - INFO - Going to convert document batch...
2025-11-14 15:42:13,670 - INFO - Processing document 4_2025-02-21
2025-11-14 15:42:13,711 - INFO - Finished converting document 4_2025-02-21 in 0.11 sec.
2025-11-14 15:42:13,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,789 - INFO - Going to convert document batch...
2025-11-14 15:42:13,792 - INFO - Processing document 4_2025-02-26
2025-11-14 15:42:13,871 - INFO - Finished converting document 4_2025-02-26 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-02-21' --> 'data\processed_data\BA\4_2025-02-21.md'
Converted 'data\edgar_documents\BA\4_2025-02-26' --> 'data\processed_data\BA\4_2025-02-26.md'


2025-11-14 15:42:14,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:14,098 - INFO - Going to convert document batch...
2025-11-14 15:42:14,101 - INFO - Processing document 4_2025-02-28
2025-11-14 15:42:14,188 - INFO - Finished converting document 4_2025-02-28 in 0.25 sec.
2025-11-14 15:42:14,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:14,317 - INFO - Going to convert document batch...
2025-11-14 15:42:14,319 - INFO - Processing document 4_2025-03-11
2025-11-14 15:42:14,388 - INFO - Finished converting document 4_2025-03-11 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-02-28' --> 'data\processed_data\BA\4_2025-02-28.md'


2025-11-14 15:42:14,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-03-11' --> 'data\processed_data\BA\4_2025-03-11.md'


2025-11-14 15:42:15,635 - INFO - Going to convert document batch...
2025-11-14 15:42:15,637 - INFO - Processing document 4_2025-04-03
2025-11-14 15:42:15,696 - INFO - Finished converting document 4_2025-04-03 in 1.23 sec.
2025-11-14 15:42:15,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:15,793 - INFO - Going to convert document batch...
2025-11-14 15:42:15,794 - INFO - Processing document 4_2025-05-05
2025-11-14 15:42:15,831 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.


Converted 'data\edgar_documents\BA\4_2025-04-03' --> 'data\processed_data\BA\4_2025-04-03.md'
Converted 'data\edgar_documents\BA\4_2025-05-05' --> 'data\processed_data\BA\4_2025-05-05.md'


2025-11-14 15:42:15,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,026 - INFO - Going to convert document batch...
2025-11-14 15:42:16,027 - INFO - Processing document 4_2025-05-08
2025-11-14 15:42:16,089 - INFO - Finished converting document 4_2025-05-08 in 0.24 sec.
2025-11-14 15:42:16,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,202 - INFO - Going to convert document batch...
2025-11-14 15:42:16,204 - INFO - Processing document 4_2025-05-15
2025-11-14 15:42:16,245 - INFO - Finished converting document 4_2025-05-15 in 0.09 sec.
2025-11-14 15:42:16,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,325 - INFO - Going to convert document batch...
2025-11-14 15:42:16,326 - INFO - Processing document 4_2025-05-19
2025-11-14 15:42:16,361 - INFO - Finished converting document 4_2025-05-19 in 0.08 sec.


Converted 'data\edgar_documents\BA\4_2025-05-08' --> 'data\processed_data\BA\4_2025-05-08.md'
Converted 'data\edgar_documents\BA\4_2025-05-15' --> 'data\processed_data\BA\4_2025-05-15.md'


2025-11-14 15:42:16,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,427 - INFO - Going to convert document batch...
2025-11-14 15:42:16,429 - INFO - Processing document 4_2025-07-03
2025-11-14 15:42:16,485 - INFO - Finished converting document 4_2025-07-03 in 0.09 sec.


Converted 'data\edgar_documents\BA\4_2025-05-19' --> 'data\processed_data\BA\4_2025-05-19.md'


2025-11-14 15:42:16,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,714 - INFO - Going to convert document batch...
2025-11-14 15:42:16,716 - INFO - Processing document 4_2025-07-31
2025-11-14 15:42:16,792 - INFO - Finished converting document 4_2025-07-31 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2025-07-03' --> 'data\processed_data\BA\4_2025-07-03.md'


2025-11-14 15:42:16,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,956 - INFO - Going to convert document batch...
2025-11-14 15:42:16,959 - INFO - Processing document 4_2025-08-12
2025-11-14 15:42:17,019 - INFO - Finished converting document 4_2025-08-12 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2025-07-31' --> 'data\processed_data\BA\4_2025-07-31.md'
Converted 'data\edgar_documents\BA\4_2025-08-12' --> 'data\processed_data\BA\4_2025-08-12.md'


2025-11-14 15:42:17,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,109 - INFO - Going to convert document batch...
2025-11-14 15:42:17,110 - INFO - Processing document 4_2025-08-19
2025-11-14 15:42:17,151 - INFO - Finished converting document 4_2025-08-19 in 0.09 sec.
2025-11-14 15:42:17,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,266 - INFO - Going to convert document batch...
2025-11-14 15:42:17,268 - INFO - Processing document 4_2025-08-21
2025-11-14 15:42:17,318 - INFO - Finished converting document 4_2025-08-21 in 0.11 sec.
2025-11-14 15:42:17,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-08-19' --> 'data\processed_data\BA\4_2025-08-19.md'
Converted 'data\edgar_documents\BA\4_2025-08-21' --> 'data\processed_data\BA\4_2025-08-21.md'


2025-11-14 15:42:17,416 - INFO - Going to convert document batch...
2025-11-14 15:42:17,417 - INFO - Processing document 4_2025-09-03
2025-11-14 15:42:17,480 - INFO - Finished converting document 4_2025-09-03 in 0.14 sec.
2025-11-14 15:42:17,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,629 - INFO - Going to convert document batch...
2025-11-14 15:42:17,631 - INFO - Processing document 4_2025-10-03
2025-11-14 15:42:17,694 - INFO - Finished converting document 4_2025-10-03 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-09-03' --> 'data\processed_data\BA\4_2025-09-03.md'
Converted 'data\edgar_documents\BA\4_2025-10-03' --> 'data\processed_data\BA\4_2025-10-03.md'


2025-11-14 15:42:17,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,834 - INFO - Going to convert document batch...
2025-11-14 15:42:17,835 - INFO - Processing document 4_2025-11-10
2025-11-14 15:42:17,882 - INFO - Finished converting document 4_2025-11-10 in 0.12 sec.
2025-11-14 15:42:17,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,014 - INFO - Going to convert document batch...
2025-11-14 15:42:18,016 - INFO - Processing document 8-K_2023-01-25
2025-11-14 15:42:18,049 - INFO - Finished converting document 8-K_2023-01-25 in 0.11 sec.
2025-11-14 15:42:18,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-11-10' --> 'data\processed_data\BA\4_2025-11-10.md'
Converted 'data\edgar_documents\BA\8-K_2023-01-25' --> 'data\processed_data\BA\8-K_2023-01-25.md'


2025-11-14 15:42:18,120 - INFO - Going to convert document batch...
2025-11-14 15:42:18,122 - INFO - Processing document 8-K_2023-02-17
2025-11-14 15:42:18,164 - INFO - Finished converting document 8-K_2023-02-17 in 0.09 sec.
2025-11-14 15:42:18,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,268 - INFO - Going to convert document batch...
2025-11-14 15:42:18,269 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:42:18,328 - INFO - Finished converting document 8-K_2023-03-15 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2023-02-17' --> 'data\processed_data\BA\8-K_2023-02-17.md'
Converted 'data\edgar_documents\BA\8-K_2023-03-15' --> 'data\processed_data\BA\8-K_2023-03-15.md'


2025-11-14 15:42:18,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,441 - INFO - Going to convert document batch...
2025-11-14 15:42:18,444 - INFO - Processing document 8-K_2023-04-11
2025-11-14 15:42:18,524 - INFO - Finished converting document 8-K_2023-04-11 in 0.16 sec.
2025-11-14 15:42:18,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,645 - INFO - Going to convert document batch...
2025-11-14 15:42:18,647 - INFO - Processing document 8-K_2023-04-19
2025-11-14 15:42:18,742 - INFO - Finished converting document 8-K_2023-04-19 in 0.19 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-11' --> 'data\processed_data\BA\8-K_2023-04-11.md'


2025-11-14 15:42:18,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,911 - INFO - Going to convert document batch...
2025-11-14 15:42:18,914 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:42:18,989 - INFO - Finished converting document 8-K_2023-04-26 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-19' --> 'data\processed_data\BA\8-K_2023-04-19.md'


2025-11-14 15:42:19,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,120 - INFO - Going to convert document batch...
2025-11-14 15:42:19,125 - INFO - Processing document 8-K_2023-07-26
2025-11-14 15:42:19,180 - INFO - Finished converting document 8-K_2023-07-26 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-26' --> 'data\processed_data\BA\8-K_2023-04-26.md'
Converted 'data\edgar_documents\BA\8-K_2023-07-26' --> 'data\processed_data\BA\8-K_2023-07-26.md'


2025-11-14 15:42:19,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,299 - INFO - Going to convert document batch...
2025-11-14 15:42:19,302 - INFO - Processing document 8-K_2023-08-24
2025-11-14 15:42:19,365 - INFO - Finished converting document 8-K_2023-08-24 in 0.16 sec.
2025-11-14 15:42:19,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,470 - INFO - Going to convert document batch...
2025-11-14 15:42:19,471 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:42:19,559 - INFO - Finished converting document 8-K_2023-09-05 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2023-08-24' --> 'data\processed_data\BA\8-K_2023-08-24.md'


2025-11-14 15:42:19,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,667 - INFO - Going to convert document batch...
2025-11-14 15:42:19,669 - INFO - Processing document 8-K_2023-09-22
2025-11-14 15:42:19,713 - INFO - Finished converting document 8-K_2023-09-22 in 0.12 sec.
2025-11-14 15:42:19,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2023-09-05' --> 'data\processed_data\BA\8-K_2023-09-05.md'
Converted 'data\edgar_documents\BA\8-K_2023-09-22' --> 'data\processed_data\BA\8-K_2023-09-22.md'


2025-11-14 15:42:19,811 - INFO - Going to convert document batch...
2025-11-14 15:42:19,812 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:42:19,847 - INFO - Finished converting document 8-K_2023-10-25 in 0.11 sec.
2025-11-14 15:42:19,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,929 - INFO - Going to convert document batch...
2025-11-14 15:42:19,935 - INFO - Processing document 8-K_2023-12-11
2025-11-14 15:42:19,999 - INFO - Finished converting document 8-K_2023-12-11 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2023-10-25' --> 'data\processed_data\BA\8-K_2023-10-25.md'
Converted 'data\edgar_documents\BA\8-K_2023-12-11' --> 'data\processed_data\BA\8-K_2023-12-11.md'


2025-11-14 15:42:20,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,106 - INFO - Going to convert document batch...
2025-11-14 15:42:20,108 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:42:20,182 - INFO - Finished converting document 8-K_2024-01-31 in 0.16 sec.
2025-11-14 15:42:20,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,253 - INFO - Going to convert document batch...
2025-11-14 15:42:20,256 - INFO - Processing document 8-K_2024-03-25
2025-11-14 15:42:20,320 - INFO - Finished converting document 8-K_2024-03-25 in 0.09 sec.
2025-11-14 15:42:20,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2024-01-31' --> 'data\processed_data\BA\8-K_2024-01-31.md'
Converted 'data\edgar_documents\BA\8-K_2024-03-25' --> 'data\processed_data\BA\8-K_2024-03-25.md'


2025-11-14 15:42:20,427 - INFO - Going to convert document batch...
2025-11-14 15:42:20,429 - INFO - Processing document 8-K_2024-04-24
2025-11-14 15:42:20,515 - INFO - Finished converting document 8-K_2024-04-24 in 0.16 sec.
2025-11-14 15:42:20,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,617 - INFO - Going to convert document batch...
2025-11-14 15:42:20,619 - INFO - Processing document 8-K_2024-05-03
2025-11-14 15:42:20,701 - INFO - Finished converting document 8-K_2024-05-03 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2024-04-24' --> 'data\processed_data\BA\8-K_2024-04-24.md'
Converted 'data\edgar_documents\BA\8-K_2024-05-03' --> 'data\processed_data\BA\8-K_2024-05-03.md'


2025-11-14 15:42:20,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,828 - INFO - Going to convert document batch...
2025-11-14 15:42:20,830 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:42:20,877 - INFO - Finished converting document 8-K_2024-05-17 in 0.14 sec.
2025-11-14 15:42:20,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,963 - INFO - Going to convert document batch...
2025-11-14 15:42:20,964 - INFO - Processing document 8-K_2024-07-01
2025-11-14 15:42:21,059 - INFO - Finished converting document 8-K_2024-07-01 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2024-05-17' --> 'data\processed_data\BA\8-K_2024-05-17.md'
Converted 'data\edgar_documents\BA\8-K_2024-07-01' --> 'data\processed_data\BA\8-K_2024-07-01.md'


2025-11-14 15:42:21,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,184 - INFO - Going to convert document batch...
2025-11-14 15:42:21,186 - INFO - Processing document 8-K_2024-07-31
2025-11-14 15:42:21,256 - INFO - Finished converting document 8-K_2024-07-31 in 0.16 sec.
2025-11-14 15:42:21,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,350 - INFO - Going to convert document batch...
2025-11-14 15:42:21,353 - INFO - Processing document 8-K_2024-09-13
2025-11-14 15:42:21,401 - INFO - Finished converting document 8-K_2024-09-13 in 0.11 sec.
2025-11-14 15:42:21,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2024-07-31' --> 'data\processed_data\BA\8-K_2024-07-31.md'
Converted 'data\edgar_documents\BA\8-K_2024-09-13' --> 'data\processed_data\BA\8-K_2024-09-13.md'


2025-11-14 15:42:21,522 - INFO - Going to convert document batch...
2025-11-14 15:42:21,524 - INFO - Processing document 8-K_2024-09-20
2025-11-14 15:42:21,555 - INFO - Finished converting document 8-K_2024-09-20 in 0.12 sec.
2025-11-14 15:42:21,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,601 - INFO - Going to convert document batch...
2025-11-14 15:42:21,602 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:42:21,634 - INFO - Finished converting document 8-K_2024-10-11 in 0.06 sec.
2025-11-14 15:42:21,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,694 - INFO - Going to convert document batch...
2025-11-14 15:42:21,696 - INFO - Processing document 8-K_2024-10-15
2025-11-14 15:42:21,730 - INFO - Finished converting document 8-K_2024-10-15 in 0.08 sec.


Converted 'data\edgar_documents\BA\8-K_2024-09-20' --> 'data\processed_data\BA\8-K_2024-09-20.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-11' --> 'data\processed_data\BA\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-15' --> 'data\processed_data\BA\8-K_2024-10-15.md'


2025-11-14 15:42:21,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,805 - INFO - Going to convert document batch...
2025-11-14 15:42:21,807 - INFO - Processing document 8-K_2024-10-23
2025-11-14 15:42:21,849 - INFO - Finished converting document 8-K_2024-10-23 in 0.09 sec.
2025-11-14 15:42:21,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,944 - INFO - Going to convert document batch...
2025-11-14 15:42:21,946 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:42:22,030 - INFO - Finished converting document 8-K_2024-10-30 in 0.17 sec.


Converted 'data\edgar_documents\BA\8-K_2024-10-23' --> 'data\processed_data\BA\8-K_2024-10-23.md'


2025-11-14 15:42:22,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,135 - INFO - Going to convert document batch...
2025-11-14 15:42:22,138 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:42:22,182 - INFO - Finished converting document 8-K_2024-10-31 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2024-10-30' --> 'data\processed_data\BA\8-K_2024-10-30.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-31' --> 'data\processed_data\BA\8-K_2024-10-31.md'


2025-11-14 15:42:22,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,270 - INFO - Going to convert document batch...
2025-11-14 15:42:22,273 - INFO - Processing document 8-K_2024-11-18
2025-11-14 15:42:22,358 - INFO - Finished converting document 8-K_2024-11-18 in 0.16 sec.
2025-11-14 15:42:22,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,465 - INFO - Going to convert document batch...
2025-11-14 15:42:22,467 - INFO - Processing document 8-K_2025-01-23
2025-11-14 15:42:22,508 - INFO - Finished converting document 8-K_2025-01-23 in 0.08 sec.
2025-11-14 15:42:22,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,593 - INFO - Going to convert document batch...
2025-11-14 15:42:22,594 - INFO - Processing document 8-K_2025-01-28


Converted 'data\edgar_documents\BA\8-K_2024-11-18' --> 'data\processed_data\BA\8-K_2024-11-18.md'
Converted 'data\edgar_documents\BA\8-K_2025-01-23' --> 'data\processed_data\BA\8-K_2025-01-23.md'


2025-11-14 15:42:22,639 - INFO - Finished converting document 8-K_2025-01-28 in 0.11 sec.
2025-11-14 15:42:22,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,733 - INFO - Going to convert document batch...
2025-11-14 15:42:22,735 - INFO - Processing document 8-K_2025-02-25
2025-11-14 15:42:22,787 - INFO - Finished converting document 8-K_2025-02-25 in 0.12 sec.
2025-11-14 15:42:22,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2025-01-28' --> 'data\processed_data\BA\8-K_2025-01-28.md'
Converted 'data\edgar_documents\BA\8-K_2025-02-25' --> 'data\processed_data\BA\8-K_2025-02-25.md'


2025-11-14 15:42:22,900 - INFO - Going to convert document batch...
2025-11-14 15:42:22,903 - INFO - Processing document 8-K_2025-04-23
2025-11-14 15:42:22,970 - INFO - Finished converting document 8-K_2025-04-23 in 0.16 sec.
2025-11-14 15:42:23,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,082 - INFO - Going to convert document batch...
2025-11-14 15:42:23,084 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:42:23,165 - INFO - Finished converting document 8-K_2025-04-24 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2025-04-23' --> 'data\processed_data\BA\8-K_2025-04-23.md'
Converted 'data\edgar_documents\BA\8-K_2025-04-24' --> 'data\processed_data\BA\8-K_2025-04-24.md'


2025-11-14 15:42:23,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,311 - INFO - Going to convert document batch...
2025-11-14 15:42:23,313 - INFO - Processing document 8-K_2025-06-04
2025-11-14 15:42:23,383 - INFO - Finished converting document 8-K_2025-06-04 in 0.16 sec.
2025-11-14 15:42:23,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,481 - INFO - Going to convert document batch...
2025-11-14 15:42:23,482 - INFO - Processing document 8-K_2025-07-03
2025-11-14 15:42:23,532 - INFO - Finished converting document 8-K_2025-07-03 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2025-06-04' --> 'data\processed_data\BA\8-K_2025-06-04.md'
Converted 'data\edgar_documents\BA\8-K_2025-07-03' --> 'data\processed_data\BA\8-K_2025-07-03.md'


2025-11-14 15:42:23,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,631 - INFO - Going to convert document batch...
2025-11-14 15:42:23,632 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:42:23,671 - INFO - Finished converting document 8-K_2025-07-29 in 0.12 sec.
2025-11-14 15:42:23,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,764 - INFO - Going to convert document batch...
2025-11-14 15:42:23,767 - INFO - Processing document 8-K_2025-08-28
2025-11-14 15:42:23,834 - INFO - Finished converting document 8-K_2025-08-28 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2025-07-29' --> 'data\processed_data\BA\8-K_2025-07-29.md'
Converted 'data\edgar_documents\BA\8-K_2025-08-28' --> 'data\processed_data\BA\8-K_2025-08-28.md'


2025-11-14 15:42:23,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,926 - INFO - Going to convert document batch...
2025-11-14 15:42:23,927 - INFO - Processing document 8-K_2025-10-29
2025-11-14 15:42:23,966 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 15:42:24,042 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:24,045 - ERROR - Input document DEF-14A_2023-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\BA\8-K_2025-10-29' --> 'data\processed_data\BA\8-K_2025-10-29.md'
Error processing data\edgar_documents\BA\DEF-14A_2023-03-03: File format not allowed: data\edgar_documents\BA\DEF-14A_2023-03-03
Error processing data\edgar_documents\BA\DEF-14A_2024-04-05: File format not allowed: data\edgar_documents\BA\DEF-14A_2024-04-05
Error processing data\edgar_documents\BA\DEF-14A_2025-03-07: File format not allowed: data\edgar_documents\BA\DEF-14A_2025-03-07
Processed 97 new files. Errors: 9
Found 128 files to process in data\edgar_documents\BK


2025-11-14 15:42:24,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:26,024 - INFO - Going to convert document batch...
2025-11-14 15:42:26,025 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:42:26,026 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:42:27,243 - INFO - Finished converting document 10-K_2023-02-27 in 3.06 sec.
2025-11-14 15:42:27,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-K_2023-02-27' --> 'data\processed_data\BK\10-K_2023-02-27.md'


2025-11-14 15:42:29,455 - INFO - Going to convert document batch...
2025-11-14 15:42:29,458 - INFO - Processing document 10-K_2024-02-28
2025-11-14 15:42:30,683 - INFO - Finished converting document 10-K_2024-02-28 in 3.06 sec.
2025-11-14 15:42:31,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-K_2024-02-28' --> 'data\processed_data\BK\10-K_2024-02-28.md'


2025-11-14 15:42:32,229 - INFO - Going to convert document batch...
2025-11-14 15:42:32,231 - INFO - Processing document 10-K_2025-02-27
2025-11-14 15:42:33,382 - INFO - Finished converting document 10-K_2025-02-27 in 2.34 sec.


Converted 'data\edgar_documents\BK\10-K_2025-02-27' --> 'data\processed_data\BK\10-K_2025-02-27.md'


2025-11-14 15:42:33,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:40,259 - INFO - Going to convert document batch...
2025-11-14 15:42:40,261 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:42:48,167 - INFO - Finished converting document 10-Q_2023-05-05 in 14.45 sec.
2025-11-14 15:42:49,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-05-05' --> 'data\processed_data\BK\10-Q_2023-05-05.md'


2025-11-14 15:42:51,900 - INFO - Going to convert document batch...
2025-11-14 15:42:51,900 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:42:56,416 - INFO - Finished converting document 10-Q_2023-08-04 in 7.17 sec.
2025-11-14 15:42:57,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-08-04' --> 'data\processed_data\BK\10-Q_2023-08-04.md'


2025-11-14 15:43:00,216 - INFO - Going to convert document batch...
2025-11-14 15:43:00,217 - INFO - Processing document 10-Q_2023-11-03
2025-11-14 15:43:04,951 - INFO - Finished converting document 10-Q_2023-11-03 in 7.23 sec.
2025-11-14 15:43:07,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-11-03' --> 'data\processed_data\BK\10-Q_2023-11-03.md'


2025-11-14 15:43:09,139 - INFO - Going to convert document batch...
2025-11-14 15:43:09,140 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:43:12,916 - INFO - Finished converting document 10-Q_2024-05-03 in 5.77 sec.
2025-11-14 15:43:14,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2024-05-03' --> 'data\processed_data\BK\10-Q_2024-05-03.md'


2025-11-14 15:43:16,606 - INFO - Going to convert document batch...
2025-11-14 15:43:16,607 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 15:43:21,775 - INFO - Finished converting document 10-Q_2024-08-02 in 7.67 sec.
2025-11-14 15:43:23,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2024-08-02' --> 'data\processed_data\BK\10-Q_2024-08-02.md'


2025-11-14 15:43:25,725 - INFO - Going to convert document batch...
2025-11-14 15:43:25,726 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:43:30,477 - INFO - Finished converting document 10-Q_2024-11-01 in 7.38 sec.


Converted 'data\edgar_documents\BK\10-Q_2024-11-01' --> 'data\processed_data\BK\10-Q_2024-11-01.md'


2025-11-14 15:43:32,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:34,189 - INFO - Going to convert document batch...
2025-11-14 15:43:34,190 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:43:37,886 - INFO - Finished converting document 10-Q_2025-05-02 in 6.09 sec.
2025-11-14 15:43:39,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2025-05-02' --> 'data\processed_data\BK\10-Q_2025-05-02.md'


2025-11-14 15:43:41,569 - INFO - Going to convert document batch...
2025-11-14 15:43:41,571 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:43:46,608 - INFO - Finished converting document 10-Q_2025-08-01 in 7.53 sec.
2025-11-14 15:43:48,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2025-08-01' --> 'data\processed_data\BK\10-Q_2025-08-01.md'


2025-11-14 15:43:50,486 - INFO - Going to convert document batch...
2025-11-14 15:43:50,487 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:43:55,093 - INFO - Finished converting document 10-Q_2025-10-31 in 7.20 sec.
2025-11-14 15:43:56,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,450 - INFO - Going to convert document batch...
2025-11-14 15:43:56,451 - INFO - Processing document 4_2023-01-19
2025-11-14 15:43:56,470 - INFO - Finished converting document 4_2023-01-19 in 0.06 sec.
2025-11-14 15:43:56,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,548 - INFO - Going to convert document batch...
2025-11-14 15:43:56,549 - INFO - Processing document 4_2023-01-24
2025-11-14 15:43:56,569 - INFO - Finished converting document 4_2023-01-24 in 0.05 sec.
2025-11-14 15:43:56,601 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\10-Q_2025-10-31' --> 'data\processed_data\BK\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\BK\4_2023-01-19' --> 'data\processed_data\BK\4_2023-01-19.md'
Converted 'data\edgar_documents\BK\4_2023-01-24' --> 'data\processed_data\BK\4_2023-01-24.md'


2025-11-14 15:43:56,601 - ERROR - Input document 4_2023-01-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:56,602 - INFO - Going to convert document batch...
2025-11-14 15:43:56,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,622 - INFO - Going to convert document batch...
2025-11-14 15:43:56,623 - INFO - Processing document 4_2023-02-03
2025-11-14 15:43:56,641 - INFO - Finished converting document 4_2023-02-03 in 0.05 sec.
2025-11-14 15:43:56,670 - INFO - detec

Error processing data\edgar_documents\BK\4_2023-01-26: File format not allowed: data\edgar_documents\BK\4_2023-01-26
Converted 'data\edgar_documents\BK\4_2023-02-03' --> 'data\processed_data\BK\4_2023-02-03.md'
Converted 'data\edgar_documents\BK\4_2023-02-10' --> 'data\processed_data\BK\4_2023-02-10.md'
Converted 'data\edgar_documents\BK\4_2023-02-14' --> 'data\processed_data\BK\4_2023-02-14.md'


2025-11-14 15:43:56,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,809 - INFO - Going to convert document batch...
2025-11-14 15:43:56,810 - INFO - Processing document 4_2023-02-15
2025-11-14 15:43:56,830 - INFO - Finished converting document 4_2023-02-15 in 0.05 sec.
2025-11-14 15:43:56,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,890 - INFO - Going to convert document batch...
2025-11-14 15:43:56,891 - INFO - Processing document 4_2023-02-17
2025-11-14 15:43:56,910 - INFO - Finished converting document 4_2023-02-17 in 0.06 sec.
2025-11-14 15:43:56,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,948 - INFO - Going to convert document batch...
2025-11-14 15:43:56,949 - INFO - Processing document 4_2023-02-21
2025-11-14 15:43:56,964 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 15:43:56,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BK\4_2023-02-15' --> 'data\processed_data\BK\4_2023-02-15.md'
Converted 'data\edgar_documents\BK\4_2023-02-17' --> 'data\processed_data\BK\4_2023-02-17.md'
Converted 'data\edgar_documents\BK\4_2023-02-21' --> 'data\processed_data\BK\4_2023-02-21.md'


2025-11-14 15:43:57,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,061 - INFO - Going to convert document batch...
2025-11-14 15:43:57,061 - INFO - Processing document 4_2023-03-03
2025-11-14 15:43:57,078 - INFO - Finished converting document 4_2023-03-03 in 0.03 sec.
2025-11-14 15:43:57,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,116 - INFO - Going to convert document batch...
2025-11-14 15:43:57,116 - INFO - Processing document 4_2023-03-10
2025-11-14 15:43:57,135 - INFO - Finished converting document 4_2023-03-10 in 0.03 sec.
2025-11-14 15:43:57,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,174 - INFO - Going to convert document batch...
2025-11-14 15:43:57,175 - INFO - Processing document 4_2023-04-05
2025-11-14 15:43:57,193 - INFO - Finished converting document 4_2023-04-05 in 0.03 sec.
2025-11-14 15:43:57,230 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\4_2023-02-28' --> 'data\processed_data\BK\4_2023-02-28.md'
Converted 'data\edgar_documents\BK\4_2023-03-03' --> 'data\processed_data\BK\4_2023-03-03.md'
Converted 'data\edgar_documents\BK\4_2023-03-10' --> 'data\processed_data\BK\4_2023-03-10.md'
Converted 'data\edgar_documents\BK\4_2023-04-05' --> 'data\processed_data\BK\4_2023-04-05.md'


2025-11-14 15:43:57,231 - ERROR - Input document 4_2023-04-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:57,232 - INFO - Going to convert document batch...
2025-11-14 15:43:57,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,251 - INFO - Going to convert document batch...
2025-11-14 15:43:57,252 - INFO - Processing document 4_2023-04-21
2025-11-14 15:43:57,275 - INFO - Finished converting document 4_2023-04-21 in 0.03 sec.
2025-11-14 15:43:57,310 - INFO - detec

Error processing data\edgar_documents\BK\4_2023-04-19: File format not allowed: data\edgar_documents\BK\4_2023-04-19
Converted 'data\edgar_documents\BK\4_2023-04-21' --> 'data\processed_data\BK\4_2023-04-21.md'
Converted 'data\edgar_documents\BK\4_2023-07-06' --> 'data\processed_data\BK\4_2023-07-06.md'
Converted 'data\edgar_documents\BK\4_2023-07-21' --> 'data\processed_data\BK\4_2023-07-21.md'


2025-11-14 15:43:57,440 - INFO - Going to convert document batch...
2025-11-14 15:43:57,442 - INFO - Processing document 4_2023-08-01
2025-11-14 15:43:57,468 - INFO - Finished converting document 4_2023-08-01 in 0.05 sec.
2025-11-14 15:43:57,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,522 - INFO - Going to convert document batch...
2025-11-14 15:43:57,523 - INFO - Processing document 4_2023-08-07
2025-11-14 15:43:57,542 - INFO - Finished converting document 4_2023-08-07 in 0.05 sec.
2025-11-14 15:43:57,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,583 - INFO - Going to convert document batch...
2025-11-14 15:43:57,583 - INFO - Processing document 4_2023-08-14


Converted 'data\edgar_documents\BK\4_2023-08-01' --> 'data\processed_data\BK\4_2023-08-01.md'
Converted 'data\edgar_documents\BK\4_2023-08-07' --> 'data\processed_data\BK\4_2023-08-07.md'


2025-11-14 15:43:58,511 - INFO - Finished converting document 4_2023-08-14 in 0.95 sec.
2025-11-14 15:43:58,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,550 - INFO - Going to convert document batch...
2025-11-14 15:43:58,551 - INFO - Processing document 4_2023-10-04
2025-11-14 15:43:58,568 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.
2025-11-14 15:43:58,598 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:58,599 - ERROR - Input document 4_2023-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\BK\4_2023-08-14' --> 'data\processed_data\BK\4_2023-08-14.md'
Converted 'data\edgar_documents\BK\4_2023-10-04' --> 'data\processed_data\BK\4_2023-10-04.md'
Error processing data\edgar_documents\BK\4_2023-10-18: File format not allowed: data\edgar_documents\BK\4_2023-10-18
Error processing data\edgar_documents\BK\4_2023-10-19: File format not allowed: data\edgar_documents\BK\4_2023-10-19
Converted 'data\edgar_documents\BK\4_2024-01-17' --> 'data\processed_data\BK\4_2024-01-17.md'


2025-11-14 15:43:58,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,750 - INFO - Going to convert document batch...
2025-11-14 15:43:58,751 - INFO - Processing document 4_2024-02-05
2025-11-14 15:43:58,768 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 15:43:58,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,808 - INFO - Going to convert document batch...
2025-11-14 15:43:58,809 - INFO - Processing document 4_2024-02-09
2025-11-14 15:43:58,827 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.
2025-11-14 15:43:58,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,865 - INFO - Going to convert document batch...
2025-11-14 15:43:58,866 - INFO - Processing document 4_2024-02-12
2025-11-14 15:43:58,883 - INFO - Finished converting document 4_2024-02-12 in 0.03 sec.
2025-11-14 15:43:58,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\4_2024-02-02' --> 'data\processed_data\BK\4_2024-02-02.md'
Converted 'data\edgar_documents\BK\4_2024-02-05' --> 'data\processed_data\BK\4_2024-02-05.md'
Converted 'data\edgar_documents\BK\4_2024-02-09' --> 'data\processed_data\BK\4_2024-02-09.md'
Converted 'data\edgar_documents\BK\4_2024-02-12' --> 'data\processed_data\BK\4_2024-02-12.md'


2025-11-14 15:43:58,926 - INFO - Going to convert document batch...
2025-11-14 15:43:58,926 - INFO - Processing document 4_2024-02-13
2025-11-14 15:43:58,943 - INFO - Finished converting document 4_2024-02-13 in 0.03 sec.
2025-11-14 15:43:58,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,985 - INFO - Going to convert document batch...
2025-11-14 15:43:58,986 - INFO - Processing document 4_2024-02-20
2025-11-14 15:43:59,008 - INFO - Finished converting document 4_2024-02-20 in 0.03 sec.
2025-11-14 15:43:59,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,052 - INFO - Going to convert document batch...
2025-11-14 15:43:59,053 - INFO - Processing document 4_2024-02-27
2025-11-14 15:43:59,075 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:43:59,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,113 - INFO - Going to convert document batch...
2025-11-14 15:43:59,113 - 

Converted 'data\edgar_documents\BK\4_2024-02-13' --> 'data\processed_data\BK\4_2024-02-13.md'
Converted 'data\edgar_documents\BK\4_2024-02-20' --> 'data\processed_data\BK\4_2024-02-20.md'
Converted 'data\edgar_documents\BK\4_2024-02-27' --> 'data\processed_data\BK\4_2024-02-27.md'
Converted 'data\edgar_documents\BK\4_2024-03-01' --> 'data\processed_data\BK\4_2024-03-01.md'


2025-11-14 15:43:59,165 - ERROR - Input document 4_2024-03-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,166 - INFO - Going to convert document batch...
2025-11-14 15:43:59,179 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,179 - ERROR - Input document 4_2024-03-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BK\4_2024-03-07: File format not allowed: data\edgar_documents\BK\4_2024-03-07
Error processing data\edgar_documents\BK\4_2024-03-08: File format not allowed: data\edgar_documents\BK\4_2024-03-08
Converted 'data\edgar_documents\BK\4_2024-04-03' --> 'data\processed_data\BK\4_2024-04-03.md'
Converted 'data\edgar_documents\BK\4_2024-04-19' --> 'data\processed_data\BK\4_2024-04-19.md'


2025-11-14 15:43:59,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,395 - INFO - Going to convert document batch...
2025-11-14 15:43:59,396 - INFO - Processing document 4_2024-04-23
2025-11-14 15:43:59,414 - INFO - Finished converting document 4_2024-04-23 in 0.03 sec.
2025-11-14 15:43:59,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,453 - INFO - Going to convert document batch...
2025-11-14 15:43:59,454 - INFO - Processing document 4_2024-05-09
2025-11-14 15:43:59,473 - INFO - Finished converting document 4_2024-05-09 in 0.03 sec.
2025-11-14 15:43:59,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,512 - INFO - Going to convert document batch...
2025-11-14 15:43:59,514 - INFO - Processing document 4_2024-07-03
2025-11-14 15:43:59,530 - INFO - Finished converting document 4_2024-07-03 in 0.03 sec.
2025-11-14 15:43:59,562 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\4_2024-04-22' --> 'data\processed_data\BK\4_2024-04-22.md'
Converted 'data\edgar_documents\BK\4_2024-04-23' --> 'data\processed_data\BK\4_2024-04-23.md'
Converted 'data\edgar_documents\BK\4_2024-05-09' --> 'data\processed_data\BK\4_2024-05-09.md'
Converted 'data\edgar_documents\BK\4_2024-07-03' --> 'data\processed_data\BK\4_2024-07-03.md'


2025-11-14 15:43:59,563 - ERROR - Input document 4_2024-07-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,564 - INFO - Going to convert document batch...
2025-11-14 15:43:59,580 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,580 - ERROR - Input document 4_2024-07-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BK\4_2024-07-15: File format not allowed: data\edgar_documents\BK\4_2024-07-15
Error processing data\edgar_documents\BK\4_2024-07-17: File format not allowed: data\edgar_documents\BK\4_2024-07-17
Converted 'data\edgar_documents\BK\4_2024-07-19' --> 'data\processed_data\BK\4_2024-07-19.md'
Converted 'data\edgar_documents\BK\4_2024-10-03' --> 'data\processed_data\BK\4_2024-10-03.md'


2025-11-14 15:43:59,749 - INFO - Processing document 4_2024-10-17
2025-11-14 15:43:59,767 - INFO - Finished converting document 4_2024-10-17 in 0.06 sec.
2025-11-14 15:43:59,801 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,802 - ERROR - Input document 4_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,803 - INFO - Going to convert document batch...
2025-11-14 15:43:59,815 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\BK\4_2024-10-17' --> 'data\processed_data\BK\4_2024-10-17.md'
Error processing data\edgar_documents\BK\4_2024-11-13: File format not allowed: data\edgar_documents\BK\4_2024-11-13
Error processing data\edgar_documents\BK\4_2024-11-14: File format not allowed: data\edgar_documents\BK\4_2024-11-14
Error processing data\edgar_documents\BK\4_2024-12-10: File format not allowed: data\edgar_documents\BK\4_2024-12-10
Converted 'data\edgar_documents\BK\4_2025-02-05' --> 'data\processed_data\BK\4_2025-02-05.md'
Converted 'data\edgar_documents\BK\4_2025-02-19' --> 'data\processed_data\BK\4_2025-02-19.md'


2025-11-14 15:43:59,987 - INFO - Going to convert document batch...
2025-11-14 15:43:59,988 - INFO - Processing document 4_2025-02-28
2025-11-14 15:44:00,008 - INFO - Finished converting document 4_2025-02-28 in 0.03 sec.
2025-11-14 15:44:00,053 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:00,053 - ERROR - Input document 4_2025-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:00,055 - INFO - Going to convert document batch...
2025-11-14 15:44:00,067 - IN

Converted 'data\edgar_documents\BK\4_2025-02-28' --> 'data\processed_data\BK\4_2025-02-28.md'
Error processing data\edgar_documents\BK\4_2025-03-03: File format not allowed: data\edgar_documents\BK\4_2025-03-03
Converted 'data\edgar_documents\BK\4_2025-03-04' --> 'data\processed_data\BK\4_2025-03-04.md'
Error processing data\edgar_documents\BK\4_2025-03-05: File format not allowed: data\edgar_documents\BK\4_2025-03-05
Error processing data\edgar_documents\BK\4_2025-03-07: File format not allowed: data\edgar_documents\BK\4_2025-03-07
Error processing data\edgar_documents\BK\4_2025-03-11: File format not allowed: data\edgar_documents\BK\4_2025-03-11


2025-11-14 15:44:00,224 - INFO - Going to convert document batch...
2025-11-14 15:44:00,225 - INFO - Processing document 4_2025-04-02
2025-11-14 15:44:00,283 - INFO - Finished converting document 4_2025-04-02 in 0.08 sec.
2025-11-14 15:44:00,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,332 - INFO - Going to convert document batch...
2025-11-14 15:44:00,333 - INFO - Processing document 4_2025-04-16
2025-11-14 15:44:00,350 - INFO - Finished converting document 4_2025-04-16 in 0.03 sec.
2025-11-14 15:44:00,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,389 - INFO - Going to convert document batch...
2025-11-14 15:44:00,390 - INFO - Processing document 4_2025-04-23
2025-11-14 15:44:00,409 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 15:44:00,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,446 - INFO - Going to convert document batch...
2025-11-14 15:44:00,447 - 

Converted 'data\edgar_documents\BK\4_2025-04-02' --> 'data\processed_data\BK\4_2025-04-02.md'
Converted 'data\edgar_documents\BK\4_2025-04-16' --> 'data\processed_data\BK\4_2025-04-16.md'
Converted 'data\edgar_documents\BK\4_2025-04-23' --> 'data\processed_data\BK\4_2025-04-23.md'
Converted 'data\edgar_documents\BK\4_2025-05-01' --> 'data\processed_data\BK\4_2025-05-01.md'


2025-11-14 15:44:00,509 - ERROR - Input document 4_2025-06-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:00,511 - INFO - Going to convert document batch...
2025-11-14 15:44:00,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,535 - INFO - Going to convert document batch...
2025-11-14 15:44:00,537 - INFO - Processing document 4_2025-07-03
2025-11-14 15:44:00,555 - INFO - Finished converting document 4_2025-07-03 in 0.03 sec.
2025-11-14 15:44:00,585 - INFO - detec

Error processing data\edgar_documents\BK\4_2025-06-04: File format not allowed: data\edgar_documents\BK\4_2025-06-04
Converted 'data\edgar_documents\BK\4_2025-07-03' --> 'data\processed_data\BK\4_2025-07-03.md'
Converted 'data\edgar_documents\BK\4_2025-07-24' --> 'data\processed_data\BK\4_2025-07-24.md'
Error processing data\edgar_documents\BK\4_2025-09-03: File format not allowed: data\edgar_documents\BK\4_2025-09-03
Error processing data\edgar_documents\BK\4_2025-09-05: File format not allowed: data\edgar_documents\BK\4_2025-09-05


2025-11-14 15:44:00,708 - INFO - Processing document 4_2025-10-03
2025-11-14 15:44:00,725 - INFO - Finished converting document 4_2025-10-03 in 0.03 sec.
2025-11-14 15:44:00,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,765 - INFO - Going to convert document batch...
2025-11-14 15:44:00,765 - INFO - Processing document 4_2025-11-03
2025-11-14 15:44:00,783 - INFO - Finished converting document 4_2025-11-03 in 0.03 sec.
2025-11-14 15:44:00,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,819 - INFO - Going to convert document batch...
2025-11-14 15:44:00,820 - INFO - Processing document 4_2025-11-07
2025-11-14 15:44:00,839 - INFO - Finished converting document 4_2025-11-07 in 0.05 sec.
2025-11-14 15:44:00,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,885 - INFO - Going to convert document batch...
2025-11-14 15:44:00,886 - INFO - Processing document 8-K_2023-01-13
2025-11-14 15:44:00,907 - 

Converted 'data\edgar_documents\BK\4_2025-10-03' --> 'data\processed_data\BK\4_2025-10-03.md'
Converted 'data\edgar_documents\BK\4_2025-11-03' --> 'data\processed_data\BK\4_2025-11-03.md'
Converted 'data\edgar_documents\BK\4_2025-11-07' --> 'data\processed_data\BK\4_2025-11-07.md'
Converted 'data\edgar_documents\BK\8-K_2023-01-13' --> 'data\processed_data\BK\8-K_2023-01-13.md'


2025-11-14 15:44:00,946 - INFO - Going to convert document batch...
2025-11-14 15:44:00,947 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:44:00,966 - INFO - Finished converting document 8-K_2023-01-31 in 0.05 sec.
2025-11-14 15:44:00,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,011 - INFO - Going to convert document batch...
2025-11-14 15:44:01,011 - INFO - Processing document 8-K_2023-04-12
2025-11-14 15:44:01,038 - INFO - Finished converting document 8-K_2023-04-12 in 0.06 sec.
2025-11-14 15:44:01,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,078 - INFO - Going to convert document batch...
2025-11-14 15:44:01,080 - INFO - Processing document 8-K_2023-04-18
2025-11-14 15:44:01,098 - INFO - Finished converting document 8-K_2023-04-18 in 0.05 sec.
2025-11-14 15:44:01,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,164 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2023-01-31' --> 'data\processed_data\BK\8-K_2023-01-31.md'
Converted 'data\edgar_documents\BK\8-K_2023-04-12' --> 'data\processed_data\BK\8-K_2023-04-12.md'
Converted 'data\edgar_documents\BK\8-K_2023-04-18' --> 'data\processed_data\BK\8-K_2023-04-18.md'


2025-11-14 15:44:01,164 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:44:01,182 - INFO - Finished converting document 8-K_2023-04-26 in 0.08 sec.
2025-11-14 15:44:01,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,215 - INFO - Going to convert document batch...
2025-11-14 15:44:01,216 - INFO - Processing document 8-K_2023-05-24
2025-11-14 15:44:01,233 - INFO - Finished converting document 8-K_2023-05-24 in 0.05 sec.
2025-11-14 15:44:01,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,264 - INFO - Going to convert document batch...
2025-11-14 15:44:01,265 - INFO - Processing document 8-K_2023-06-30
2025-11-14 15:44:01,277 - INFO - Finished converting document 8-K_2023-06-30 in 0.05 sec.
2025-11-14 15:44:01,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,311 - INFO - Going to convert document batch...
2025-11-14 15:44:01,312 - INFO - Processing document 8-K_2023-07-18
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-04-26' --> 'data\processed_data\BK\8-K_2023-04-26.md'
Converted 'data\edgar_documents\BK\8-K_2023-05-24' --> 'data\processed_data\BK\8-K_2023-05-24.md'
Converted 'data\edgar_documents\BK\8-K_2023-06-30' --> 'data\processed_data\BK\8-K_2023-06-30.md'
Converted 'data\edgar_documents\BK\8-K_2023-07-18' --> 'data\processed_data\BK\8-K_2023-07-18.md'


2025-11-14 15:44:01,375 - INFO - Processing document 8-K_2023-08-11
2025-11-14 15:44:01,399 - INFO - Finished converting document 8-K_2023-08-11 in 0.05 sec.
2025-11-14 15:44:01,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,436 - INFO - Going to convert document batch...
2025-11-14 15:44:01,437 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:44:01,456 - INFO - Finished converting document 8-K_2023-09-05 in 0.05 sec.
2025-11-14 15:44:01,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,490 - INFO - Going to convert document batch...
2025-11-14 15:44:01,491 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:44:01,510 - INFO - Finished converting document 8-K_2023-09-12 in 0.05 sec.
2025-11-14 15:44:01,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,548 - INFO - Going to convert document batch...
2025-11-14 15:44:01,549 - INFO - Processing document 8-K_2023-10-17
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-08-11' --> 'data\processed_data\BK\8-K_2023-08-11.md'
Converted 'data\edgar_documents\BK\8-K_2023-09-05' --> 'data\processed_data\BK\8-K_2023-09-05.md'
Converted 'data\edgar_documents\BK\8-K_2023-09-12' --> 'data\processed_data\BK\8-K_2023-09-12.md'
Converted 'data\edgar_documents\BK\8-K_2023-10-17' --> 'data\processed_data\BK\8-K_2023-10-17.md'


2025-11-14 15:44:01,606 - INFO - Going to convert document batch...
2025-11-14 15:44:01,607 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:44:01,627 - INFO - Finished converting document 8-K_2023-10-25 in 0.05 sec.
2025-11-14 15:44:01,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,659 - INFO - Going to convert document batch...
2025-11-14 15:44:01,660 - INFO - Processing document 8-K_2023-11-17
2025-11-14 15:44:01,675 - INFO - Finished converting document 8-K_2023-11-17 in 0.03 sec.
2025-11-14 15:44:01,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,708 - INFO - Going to convert document batch...
2025-11-14 15:44:01,708 - INFO - Processing document 8-K_2023-12-21
2025-11-14 15:44:01,725 - INFO - Finished converting document 8-K_2023-12-21 in 0.03 sec.
2025-11-14 15:44:01,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,761 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-10-25' --> 'data\processed_data\BK\8-K_2023-10-25.md'
Converted 'data\edgar_documents\BK\8-K_2023-11-17' --> 'data\processed_data\BK\8-K_2023-11-17.md'
Converted 'data\edgar_documents\BK\8-K_2023-12-21' --> 'data\processed_data\BK\8-K_2023-12-21.md'
Converted 'data\edgar_documents\BK\8-K_2024-01-12' --> 'data\processed_data\BK\8-K_2024-01-12.md'


2025-11-14 15:44:01,853 - INFO - Going to convert document batch...
2025-11-14 15:44:01,854 - INFO - Processing document 8-K_2024-03-05
2025-11-14 15:44:01,867 - INFO - Finished converting document 8-K_2024-03-05 in 0.06 sec.
2025-11-14 15:44:01,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,931 - INFO - Going to convert document batch...
2025-11-14 15:44:01,931 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:44:01,947 - INFO - Finished converting document 8-K_2024-03-14 in 0.06 sec.
2025-11-14 15:44:01,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,978 - INFO - Going to convert document batch...
2025-11-14 15:44:01,980 - INFO - Processing document 8-K_2024-03-26
2025-11-14 15:44:01,995 - INFO - Finished converting document 8-K_2024-03-26 in 0.05 sec.
2025-11-14 15:44:02,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,033 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2024-03-05' --> 'data\processed_data\BK\8-K_2024-03-05.md'
Converted 'data\edgar_documents\BK\8-K_2024-03-14' --> 'data\processed_data\BK\8-K_2024-03-14.md'
Converted 'data\edgar_documents\BK\8-K_2024-03-26' --> 'data\processed_data\BK\8-K_2024-03-26.md'


2025-11-14 15:44:02,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,096 - INFO - Going to convert document batch...
2025-11-14 15:44:02,097 - INFO - Processing document 8-K_2024-04-16
2025-11-14 15:44:02,116 - INFO - Finished converting document 8-K_2024-04-16 in 0.05 sec.
2025-11-14 15:44:02,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,176 - INFO - Going to convert document batch...
2025-11-14 15:44:02,177 - INFO - Processing document 8-K_2024-06-18
2025-11-14 15:44:02,191 - INFO - Finished converting document 8-K_2024-06-18 in 0.06 sec.
2025-11-14 15:44:02,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,250 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2024-04-10' --> 'data\processed_data\BK\8-K_2024-04-10.md'
Converted 'data\edgar_documents\BK\8-K_2024-04-16' --> 'data\processed_data\BK\8-K_2024-04-16.md'
Converted 'data\edgar_documents\BK\8-K_2024-06-18' --> 'data\processed_data\BK\8-K_2024-06-18.md'


2025-11-14 15:44:02,251 - INFO - Processing document 8-K_2024-06-28
2025-11-14 15:44:02,265 - INFO - Finished converting document 8-K_2024-06-28 in 0.06 sec.
2025-11-14 15:44:02,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,323 - INFO - Going to convert document batch...
2025-11-14 15:44:02,325 - INFO - Processing document 8-K_2024-07-12
2025-11-14 15:44:02,362 - INFO - Finished converting document 8-K_2024-07-12 in 0.09 sec.
2025-11-14 15:44:02,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,399 - INFO - Going to convert document batch...
2025-11-14 15:44:02,400 - INFO - Processing document 8-K_2024-07-22
2025-11-14 15:44:02,417 - INFO - Finished converting document 8-K_2024-07-22 in 0.05 sec.
2025-11-14 15:44:02,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,450 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2024-06-28' --> 'data\processed_data\BK\8-K_2024-06-28.md'
Converted 'data\edgar_documents\BK\8-K_2024-07-12' --> 'data\processed_data\BK\8-K_2024-07-12.md'
Converted 'data\edgar_documents\BK\8-K_2024-07-22' --> 'data\processed_data\BK\8-K_2024-07-22.md'


2025-11-14 15:44:02,451 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:44:02,470 - INFO - Finished converting document 8-K_2024-10-11 in 0.05 sec.
2025-11-14 15:44:02,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,509 - INFO - Going to convert document batch...
2025-11-14 15:44:02,510 - INFO - Processing document 8-K_2024-11-20
2025-11-14 15:44:02,528 - INFO - Finished converting document 8-K_2024-11-20 in 0.05 sec.
2025-11-14 15:44:02,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,559 - INFO - Going to convert document batch...
2025-11-14 15:44:02,560 - INFO - Processing document 8-K_2024-12-05
2025-11-14 15:44:02,575 - INFO - Finished converting document 8-K_2024-12-05 in 0.05 sec.
2025-11-14 15:44:02,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,604 - INFO - Going to convert document batch...
2025-11-14 15:44:02,605 - INFO - Processing document 8-K_2025-01-08
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2024-10-11' --> 'data\processed_data\BK\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BK\8-K_2024-11-20' --> 'data\processed_data\BK\8-K_2024-11-20.md'
Converted 'data\edgar_documents\BK\8-K_2024-12-05' --> 'data\processed_data\BK\8-K_2024-12-05.md'
Converted 'data\edgar_documents\BK\8-K_2025-01-08' --> 'data\processed_data\BK\8-K_2025-01-08.md'


2025-11-14 15:44:02,674 - INFO - Finished converting document 8-K_2025-01-15 in 0.05 sec.
2025-11-14 15:44:02,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,712 - INFO - Going to convert document batch...
2025-11-14 15:44:02,713 - INFO - Processing document 8-K_2025-02-11
2025-11-14 15:44:02,729 - INFO - Finished converting document 8-K_2025-02-11 in 0.05 sec.
2025-11-14 15:44:02,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,763 - INFO - Going to convert document batch...
2025-11-14 15:44:02,764 - INFO - Processing document 8-K_2025-03-03


Converted 'data\edgar_documents\BK\8-K_2025-01-15' --> 'data\processed_data\BK\8-K_2025-01-15.md'
Converted 'data\edgar_documents\BK\8-K_2025-02-11' --> 'data\processed_data\BK\8-K_2025-02-11.md'


2025-11-14 15:44:03,014 - INFO - Finished converting document 8-K_2025-03-03 in 0.28 sec.
2025-11-14 15:44:03,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,077 - INFO - Going to convert document batch...
2025-11-14 15:44:03,077 - INFO - Processing document 8-K_2025-03-10
2025-11-14 15:44:03,099 - INFO - Finished converting document 8-K_2025-03-10 in 0.08 sec.
2025-11-14 15:44:03,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,140 - INFO - Going to convert document batch...
2025-11-14 15:44:03,141 - INFO - Processing document 8-K_2025-03-14
2025-11-14 15:44:03,164 - INFO - Finished converting document 8-K_2025-03-14 in 0.05 sec.
2025-11-14 15:44:03,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,205 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2025-03-03' --> 'data\processed_data\BK\8-K_2025-03-03.md'
Converted 'data\edgar_documents\BK\8-K_2025-03-10' --> 'data\processed_data\BK\8-K_2025-03-10.md'
Converted 'data\edgar_documents\BK\8-K_2025-03-14' --> 'data\processed_data\BK\8-K_2025-03-14.md'


2025-11-14 15:44:03,206 - INFO - Processing document 8-K_2025-04-11
2025-11-14 15:44:03,226 - INFO - Finished converting document 8-K_2025-04-11 in 0.05 sec.
2025-11-14 15:44:03,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,271 - INFO - Going to convert document batch...
2025-11-14 15:44:03,272 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:44:03,295 - INFO - Finished converting document 8-K_2025-04-16 in 0.06 sec.
2025-11-14 15:44:03,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,370 - INFO - Going to convert document batch...
2025-11-14 15:44:03,371 - INFO - Processing document 8-K_2025-06-10
2025-11-14 15:44:03,389 - INFO - Finished converting document 8-K_2025-06-10 in 0.08 sec.
2025-11-14 15:44:03,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,421 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2025-04-11' --> 'data\processed_data\BK\8-K_2025-04-11.md'
Converted 'data\edgar_documents\BK\8-K_2025-04-16' --> 'data\processed_data\BK\8-K_2025-04-16.md'
Converted 'data\edgar_documents\BK\8-K_2025-06-10' --> 'data\processed_data\BK\8-K_2025-06-10.md'


2025-11-14 15:44:03,422 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:44:03,439 - INFO - Finished converting document 8-K_2025-06-12 in 0.05 sec.
2025-11-14 15:44:03,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,472 - INFO - Going to convert document batch...
2025-11-14 15:44:03,473 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:44:03,489 - INFO - Finished converting document 8-K_2025-07-01 in 0.03 sec.
2025-11-14 15:44:03,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,520 - INFO - Going to convert document batch...
2025-11-14 15:44:03,521 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:44:03,541 - INFO - Finished converting document 8-K_2025-07-15 in 0.03 sec.
2025-11-14 15:44:03,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,579 - INFO - Going to convert document batch...
2025-11-14 15:44:03,580 - INFO - Processing document 8-K_2025-09-03
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2025-06-12' --> 'data\processed_data\BK\8-K_2025-06-12.md'
Converted 'data\edgar_documents\BK\8-K_2025-07-01' --> 'data\processed_data\BK\8-K_2025-07-01.md'
Converted 'data\edgar_documents\BK\8-K_2025-07-15' --> 'data\processed_data\BK\8-K_2025-07-15.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-03' --> 'data\processed_data\BK\8-K_2025-09-03.md'


2025-11-14 15:44:03,665 - INFO - Going to convert document batch...
2025-11-14 15:44:03,665 - INFO - Processing document 8-K_2025-09-10
2025-11-14 15:44:03,689 - INFO - Finished converting document 8-K_2025-09-10 in 0.08 sec.
2025-11-14 15:44:03,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,727 - INFO - Going to convert document batch...
2025-11-14 15:44:03,728 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:44:03,745 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:44:03,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,778 - INFO - Going to convert document batch...
2025-11-14 15:44:03,779 - INFO - Processing document 8-K_2025-09-23
2025-11-14 15:44:03,796 - INFO - Finished converting document 8-K_2025-09-23 in 0.05 sec.
2025-11-14 15:44:03,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,861 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2025-09-10' --> 'data\processed_data\BK\8-K_2025-09-10.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-11' --> 'data\processed_data\BK\8-K_2025-09-11.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-23' --> 'data\processed_data\BK\8-K_2025-09-23.md'


2025-11-14 15:44:03,935 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:03,936 - ERROR - Input document DEF-14A_2023-03-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:03,939 - INFO - Going to convert document batch...
2025-11-14 15:44:03,975 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:03,976 - ERROR - Input document DEF-14A_2024-02-29 with format No

Converted 'data\edgar_documents\BK\8-K_2025-10-16' --> 'data\processed_data\BK\8-K_2025-10-16.md'
Error processing data\edgar_documents\BK\DEF-14A_2023-03-01: File format not allowed: data\edgar_documents\BK\DEF-14A_2023-03-01
Error processing data\edgar_documents\BK\DEF-14A_2024-02-29: File format not allowed: data\edgar_documents\BK\DEF-14A_2024-02-29
Error processing data\edgar_documents\BK\DEF-14A_2025-03-05: File format not allowed: data\edgar_documents\BK\DEF-14A_2025-03-05
Processed 107 new files. Errors: 21
Found 124 files to process in data\edgar_documents\BKNG


2025-11-14 15:44:04,854 - INFO - Going to convert document batch...
2025-11-14 15:44:04,855 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:44:04,855 - INFO - Processing document 10-K_2023-02-23
2025-11-14 15:44:06,848 - INFO - Finished converting document 10-K_2023-02-23 in 2.83 sec.
2025-11-14 15:44:07,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2023-02-23' --> 'data\processed_data\BKNG\10-K_2023-02-23.md'


2025-11-14 15:44:08,267 - INFO - Going to convert document batch...
2025-11-14 15:44:08,268 - INFO - Processing document 10-K_2024-02-22
2025-11-14 15:44:13,205 - INFO - Finished converting document 10-K_2024-02-22 in 5.81 sec.
2025-11-14 15:44:15,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2024-02-22' --> 'data\processed_data\BKNG\10-K_2024-02-22.md'


2025-11-14 15:44:16,945 - INFO - Going to convert document batch...
2025-11-14 15:44:16,947 - INFO - Processing document 10-K_2025-02-20
2025-11-14 15:44:23,699 - INFO - Finished converting document 10-K_2025-02-20 in 8.75 sec.
2025-11-14 15:44:25,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2025-02-20' --> 'data\processed_data\BKNG\10-K_2025-02-20.md'


2025-11-14 15:44:27,159 - INFO - Going to convert document batch...
2025-11-14 15:44:27,160 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 15:44:29,246 - INFO - Finished converting document 10-Q_2023-05-04 in 3.72 sec.
2025-11-14 15:44:30,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-05-04' --> 'data\processed_data\BKNG\10-Q_2023-05-04.md'


2025-11-14 15:44:33,177 - INFO - Going to convert document batch...
2025-11-14 15:44:33,181 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 15:44:35,462 - INFO - Finished converting document 10-Q_2023-08-03 in 4.84 sec.
2025-11-14 15:44:36,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-08-03' --> 'data\processed_data\BKNG\10-Q_2023-08-03.md'


2025-11-14 15:44:38,390 - INFO - Going to convert document batch...
2025-11-14 15:44:38,392 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 15:44:41,114 - INFO - Finished converting document 10-Q_2023-11-02 in 4.26 sec.
2025-11-14 15:44:42,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-11-02' --> 'data\processed_data\BKNG\10-Q_2023-11-02.md'


2025-11-14 15:44:44,063 - INFO - Going to convert document batch...
2025-11-14 15:44:44,064 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:44:46,084 - INFO - Finished converting document 10-Q_2024-05-02 in 3.83 sec.
2025-11-14 15:44:47,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-05-02' --> 'data\processed_data\BKNG\10-Q_2024-05-02.md'


2025-11-14 15:44:49,403 - INFO - Going to convert document batch...
2025-11-14 15:44:49,406 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 15:44:52,075 - INFO - Finished converting document 10-Q_2024-08-01 in 4.80 sec.
2025-11-14 15:44:53,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-08-01' --> 'data\processed_data\BKNG\10-Q_2024-08-01.md'


2025-11-14 15:44:54,532 - INFO - Going to convert document batch...
2025-11-14 15:44:54,534 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 15:44:56,794 - INFO - Finished converting document 10-Q_2024-10-30 in 3.50 sec.
2025-11-14 15:44:57,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-10-30' --> 'data\processed_data\BKNG\10-Q_2024-10-30.md'


2025-11-14 15:44:59,994 - INFO - Going to convert document batch...
2025-11-14 15:44:59,996 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 15:45:02,117 - INFO - Finished converting document 10-Q_2025-04-29 in 4.16 sec.
2025-11-14 15:45:03,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2025-04-29' --> 'data\processed_data\BKNG\10-Q_2025-04-29.md'


2025-11-14 15:45:04,655 - INFO - Going to convert document batch...
2025-11-14 15:45:04,657 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:45:07,862 - INFO - Finished converting document 10-Q_2025-07-29 in 4.69 sec.
2025-11-14 15:45:09,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2025-07-29' --> 'data\processed_data\BKNG\10-Q_2025-07-29.md'


2025-11-14 15:45:10,508 - INFO - Going to convert document batch...
2025-11-14 15:45:10,510 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 15:45:12,970 - INFO - Finished converting document 10-Q_2025-10-28 in 3.78 sec.
2025-11-14 15:45:14,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,294 - INFO - Going to convert document batch...
2025-11-14 15:45:14,296 - INFO - Processing document 4_2023-01-19
2025-11-14 15:45:14,416 - INFO - Finished converting document 4_2023-01-19 in 0.19 sec.


Converted 'data\edgar_documents\BKNG\10-Q_2025-10-28' --> 'data\processed_data\BKNG\10-Q_2025-10-28.md'


2025-11-14 15:45:14,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,577 - INFO - Going to convert document batch...
2025-11-14 15:45:14,585 - INFO - Processing document 4_2023-02-17
2025-11-14 15:45:14,637 - INFO - Finished converting document 4_2023-02-17 in 0.11 sec.
2025-11-14 15:45:14,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-01-19' --> 'data\processed_data\BKNG\4_2023-01-19.md'
Converted 'data\edgar_documents\BKNG\4_2023-02-17' --> 'data\processed_data\BKNG\4_2023-02-17.md'


2025-11-14 15:45:14,749 - INFO - Going to convert document batch...
2025-11-14 15:45:14,750 - INFO - Processing document 4_2023-03-06
2025-11-14 15:45:14,826 - INFO - Finished converting document 4_2023-03-06 in 0.14 sec.
2025-11-14 15:45:14,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,918 - INFO - Going to convert document batch...
2025-11-14 15:45:14,919 - INFO - Processing document 4_2023-03-08
2025-11-14 15:45:14,953 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:45:15,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-03-06' --> 'data\processed_data\BKNG\4_2023-03-06.md'
Converted 'data\edgar_documents\BKNG\4_2023-03-08' --> 'data\processed_data\BKNG\4_2023-03-08.md'


2025-11-14 15:45:15,067 - INFO - Going to convert document batch...
2025-11-14 15:45:15,070 - INFO - Processing document 4_2023-03-10
2025-11-14 15:45:15,132 - INFO - Finished converting document 4_2023-03-10 in 0.11 sec.
2025-11-14 15:45:15,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,200 - INFO - Going to convert document batch...
2025-11-14 15:45:15,202 - INFO - Processing document 4_2023-03-17
2025-11-14 15:45:15,259 - INFO - Finished converting document 4_2023-03-17 in 0.08 sec.


Converted 'data\edgar_documents\BKNG\4_2023-03-10' --> 'data\processed_data\BKNG\4_2023-03-10.md'
Converted 'data\edgar_documents\BKNG\4_2023-03-17' --> 'data\processed_data\BKNG\4_2023-03-17.md'


2025-11-14 15:45:15,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,388 - INFO - Going to convert document batch...
2025-11-14 15:45:15,390 - INFO - Processing document 4_2023-04-18
2025-11-14 15:45:15,428 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:45:15,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,520 - INFO - Going to convert document batch...
2025-11-14 15:45:15,521 - INFO - Processing document 4_2023-04-19
2025-11-14 15:45:15,565 - INFO - Finished converting document 4_2023-04-19 in 0.08 sec.
2025-11-14 15:45:15,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,647 - INFO - Going to convert document batch...
2025-11-14 15:45:15,648 - INFO - Processing document 4_2023-05-02


Converted 'data\edgar_documents\BKNG\4_2023-04-18' --> 'data\processed_data\BKNG\4_2023-04-18.md'
Converted 'data\edgar_documents\BKNG\4_2023-04-19' --> 'data\processed_data\BKNG\4_2023-04-19.md'


2025-11-14 15:45:15,683 - INFO - Finished converting document 4_2023-05-02 in 0.08 sec.
2025-11-14 15:45:15,773 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:15,773 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:15,775 - INFO - Going to convert document batch...
2025-11-14 15:45:15,803 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:15,804 - ERROR - Input document 4_2023-05-10 with forma

Converted 'data\edgar_documents\BKNG\4_2023-05-02' --> 'data\processed_data\BKNG\4_2023-05-02.md'
Error processing data\edgar_documents\BKNG\4_2023-05-09: File format not allowed: data\edgar_documents\BKNG\4_2023-05-09
Error processing data\edgar_documents\BKNG\4_2023-05-10: File format not allowed: data\edgar_documents\BKNG\4_2023-05-10


2025-11-14 15:45:15,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,991 - INFO - Going to convert document batch...
2025-11-14 15:45:15,993 - INFO - Processing document 4_2023-05-31
2025-11-14 15:45:16,032 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.
2025-11-14 15:45:16,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-05-16' --> 'data\processed_data\BKNG\4_2023-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-05-31' --> 'data\processed_data\BKNG\4_2023-05-31.md'


2025-11-14 15:45:16,144 - INFO - Going to convert document batch...
2025-11-14 15:45:16,145 - INFO - Processing document 4_2023-06-16
2025-11-14 15:45:17,079 - INFO - Finished converting document 4_2023-06-16 in 0.98 sec.
2025-11-14 15:45:17,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,176 - INFO - Going to convert document batch...
2025-11-14 15:45:17,177 - INFO - Processing document 4_2023-07-18
2025-11-14 15:45:17,230 - INFO - Finished converting document 4_2023-07-18 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2023-06-16' --> 'data\processed_data\BKNG\4_2023-06-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-07-18' --> 'data\processed_data\BKNG\4_2023-07-18.md'


2025-11-14 15:45:17,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,322 - INFO - Going to convert document batch...
2025-11-14 15:45:17,323 - INFO - Processing document 4_2023-08-09
2025-11-14 15:45:17,357 - INFO - Finished converting document 4_2023-08-09 in 0.08 sec.
2025-11-14 15:45:17,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,423 - INFO - Going to convert document batch...
2025-11-14 15:45:17,424 - INFO - Processing document 4_2023-08-10
2025-11-14 15:45:17,450 - INFO - Finished converting document 4_2023-08-10 in 0.06 sec.
2025-11-14 15:45:17,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-08-09' --> 'data\processed_data\BKNG\4_2023-08-09.md'
Converted 'data\edgar_documents\BKNG\4_2023-08-10' --> 'data\processed_data\BKNG\4_2023-08-10.md'


2025-11-14 15:45:17,588 - INFO - Going to convert document batch...
2025-11-14 15:45:17,590 - INFO - Processing document 4_2023-08-14
2025-11-14 15:45:17,653 - INFO - Finished converting document 4_2023-08-14 in 0.12 sec.
2025-11-14 15:45:17,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,732 - INFO - Going to convert document batch...
2025-11-14 15:45:17,733 - INFO - Processing document 4_2023-08-16
2025-11-14 15:45:17,764 - INFO - Finished converting document 4_2023-08-16 in 0.06 sec.
2025-11-14 15:45:17,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,835 - INFO - Going to convert document batch...
2025-11-14 15:45:17,837 - INFO - Processing document 4_2023-08-28
2025-11-14 15:45:17,871 - INFO - Finished converting document 4_2023-08-28 in 0.08 sec.


Converted 'data\edgar_documents\BKNG\4_2023-08-14' --> 'data\processed_data\BKNG\4_2023-08-14.md'
Converted 'data\edgar_documents\BKNG\4_2023-08-16' --> 'data\processed_data\BKNG\4_2023-08-16.md'


2025-11-14 15:45:17,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,950 - INFO - Going to convert document batch...
2025-11-14 15:45:17,952 - INFO - Processing document 4_2023-09-01
2025-11-14 15:45:18,028 - INFO - Finished converting document 4_2023-09-01 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\4_2023-08-28' --> 'data\processed_data\BKNG\4_2023-08-28.md'


2025-11-14 15:45:18,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,140 - INFO - Going to convert document batch...
2025-11-14 15:45:18,141 - INFO - Processing document 4_2023-09-12
2025-11-14 15:45:18,184 - INFO - Finished converting document 4_2023-09-12 in 0.09 sec.
2025-11-14 15:45:18,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,272 - INFO - Going to convert document batch...
2025-11-14 15:45:18,273 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\BKNG\4_2023-09-01' --> 'data\processed_data\BKNG\4_2023-09-01.md'
Converted 'data\edgar_documents\BKNG\4_2023-09-12' --> 'data\processed_data\BKNG\4_2023-09-12.md'


2025-11-14 15:45:18,355 - INFO - Finished converting document 4_2023-09-18 in 0.14 sec.
2025-11-14 15:45:18,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,463 - INFO - Going to convert document batch...
2025-11-14 15:45:18,464 - INFO - Processing document 4_2023-10-17
2025-11-14 15:45:18,578 - INFO - Finished converting document 4_2023-10-17 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\4_2023-09-18' --> 'data\processed_data\BKNG\4_2023-09-18.md'


2025-11-14 15:45:18,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,724 - INFO - Going to convert document batch...
2025-11-14 15:45:18,725 - INFO - Processing document 4_2023-11-13
2025-11-14 15:45:18,775 - INFO - Finished converting document 4_2023-11-13 in 0.09 sec.
2025-11-14 15:45:18,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,884 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BKNG\4_2023-10-17' --> 'data\processed_data\BKNG\4_2023-10-17.md'
Converted 'data\edgar_documents\BKNG\4_2023-11-13' --> 'data\processed_data\BKNG\4_2023-11-13.md'


2025-11-14 15:45:18,885 - INFO - Processing document 4_2023-11-16
2025-11-14 15:45:18,958 - INFO - Finished converting document 4_2023-11-16 in 0.12 sec.
2025-11-14 15:45:19,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,053 - INFO - Going to convert document batch...
2025-11-14 15:45:19,054 - INFO - Processing document 4_2023-12-12
2025-11-14 15:45:19,102 - INFO - Finished converting document 4_2023-12-12 in 0.08 sec.
2025-11-14 15:45:19,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-11-16' --> 'data\processed_data\BKNG\4_2023-11-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-12-12' --> 'data\processed_data\BKNG\4_2023-12-12.md'


2025-11-14 15:45:19,233 - INFO - Going to convert document batch...
2025-11-14 15:45:19,234 - INFO - Processing document 4_2023-12-18
2025-11-14 15:45:19,301 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:45:19,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,461 - INFO - Going to convert document batch...
2025-11-14 15:45:19,464 - INFO - Processing document 4_2024-01-17


Converted 'data\edgar_documents\BKNG\4_2023-12-18' --> 'data\processed_data\BKNG\4_2023-12-18.md'


2025-11-14 15:45:19,574 - INFO - Finished converting document 4_2024-01-17 in 0.23 sec.
2025-11-14 15:45:19,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,677 - INFO - Going to convert document batch...
2025-11-14 15:45:19,680 - INFO - Processing document 4_2024-02-08
2025-11-14 15:45:19,716 - INFO - Finished converting document 4_2024-02-08 in 0.08 sec.
2025-11-14 15:45:19,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-01-17' --> 'data\processed_data\BKNG\4_2024-01-17.md'
Converted 'data\edgar_documents\BKNG\4_2024-02-08' --> 'data\processed_data\BKNG\4_2024-02-08.md'


2025-11-14 15:45:19,850 - INFO - Going to convert document batch...
2025-11-14 15:45:19,853 - INFO - Processing document 4_2024-02-16
2025-11-14 15:45:19,977 - INFO - Finished converting document 4_2024-02-16 in 0.22 sec.
2025-11-14 15:45:20,155 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:20,157 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:20,162 - INFO - Going to convert document batch...
2025-11-14 15:45:20,225 - IN

Converted 'data\edgar_documents\BKNG\4_2024-02-16' --> 'data\processed_data\BKNG\4_2024-02-16.md'
Error processing data\edgar_documents\BKNG\4_2024-02-27: File format not allowed: data\edgar_documents\BKNG\4_2024-02-27
Error processing data\edgar_documents\BKNG\4_2024-02-28: File format not allowed: data\edgar_documents\BKNG\4_2024-02-28


2025-11-14 15:45:20,307 - INFO - Finished converting document 4_2024-03-05 in 0.08 sec.
2025-11-14 15:45:20,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,386 - INFO - Going to convert document batch...
2025-11-14 15:45:20,387 - INFO - Processing document 4_2024-03-08
2025-11-14 15:45:20,449 - INFO - Finished converting document 4_2024-03-08 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-03-05' --> 'data\processed_data\BKNG\4_2024-03-05.md'


2025-11-14 15:45:20,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,576 - INFO - Going to convert document batch...
2025-11-14 15:45:20,578 - INFO - Processing document 4_2024-03-18
2025-11-14 15:45:20,638 - INFO - Finished converting document 4_2024-03-18 in 0.11 sec.
2025-11-14 15:45:20,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-03-08' --> 'data\processed_data\BKNG\4_2024-03-08.md'
Converted 'data\edgar_documents\BKNG\4_2024-03-18' --> 'data\processed_data\BKNG\4_2024-03-18.md'


2025-11-14 15:45:20,754 - INFO - Going to convert document batch...
2025-11-14 15:45:20,756 - INFO - Processing document 4_2024-04-16
2025-11-14 15:45:20,859 - INFO - Finished converting document 4_2024-04-16 in 0.19 sec.
2025-11-14 15:45:20,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,949 - INFO - Going to convert document batch...
2025-11-14 15:45:20,950 - INFO - Processing document 4_2024-05-03
2025-11-14 15:45:21,049 - INFO - Finished converting document 4_2024-05-03 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\4_2024-04-16' --> 'data\processed_data\BKNG\4_2024-04-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-03' --> 'data\processed_data\BKNG\4_2024-05-03.md'


2025-11-14 15:45:21,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,164 - INFO - Going to convert document batch...
2025-11-14 15:45:21,167 - INFO - Processing document 4_2024-05-09
2025-11-14 15:45:21,239 - INFO - Finished converting document 4_2024-05-09 in 0.12 sec.
2025-11-14 15:45:21,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,360 - INFO - Going to convert document batch...
2025-11-14 15:45:21,363 - INFO - Processing document 4_2024-05-13
2025-11-14 15:45:21,430 - INFO - Finished converting document 4_2024-05-13 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-05-09' --> 'data\processed_data\BKNG\4_2024-05-09.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-13' --> 'data\processed_data\BKNG\4_2024-05-13.md'


2025-11-14 15:45:21,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,601 - INFO - Going to convert document batch...
2025-11-14 15:45:21,603 - INFO - Processing document 4_2024-05-16
2025-11-14 15:45:21,720 - INFO - Finished converting document 4_2024-05-16 in 0.20 sec.
2025-11-14 15:45:21,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,853 - INFO - Going to convert document batch...
2025-11-14 15:45:21,855 - INFO - Processing document 4_2024-05-31
2025-11-14 15:45:21,917 - INFO - Finished converting document 4_2024-05-31 in 0.11 sec.
2025-11-14 15:45:22,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-05-16' --> 'data\processed_data\BKNG\4_2024-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-31' --> 'data\processed_data\BKNG\4_2024-05-31.md'


2025-11-14 15:45:22,086 - INFO - Going to convert document batch...
2025-11-14 15:45:22,088 - INFO - Processing document 4_2024-06-18
2025-11-14 15:45:22,189 - INFO - Finished converting document 4_2024-06-18 in 0.22 sec.
2025-11-14 15:45:22,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,319 - INFO - Going to convert document batch...
2025-11-14 15:45:22,322 - INFO - Processing document 4_2024-07-16


Converted 'data\edgar_documents\BKNG\4_2024-06-18' --> 'data\processed_data\BKNG\4_2024-06-18.md'


2025-11-14 15:45:22,481 - INFO - Finished converting document 4_2024-07-16 in 0.23 sec.
2025-11-14 15:45:22,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,636 - INFO - Going to convert document batch...
2025-11-14 15:45:22,638 - INFO - Processing document 4_2024-08-13
2025-11-14 15:45:22,707 - INFO - Finished converting document 4_2024-08-13 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-07-16' --> 'data\processed_data\BKNG\4_2024-07-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-08-13' --> 'data\processed_data\BKNG\4_2024-08-13.md'


2025-11-14 15:45:22,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,828 - INFO - Going to convert document batch...
2025-11-14 15:45:22,830 - INFO - Processing document 4_2024-08-16
2025-11-14 15:45:22,907 - INFO - Finished converting document 4_2024-08-16 in 0.14 sec.
2025-11-14 15:45:23,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,038 - INFO - Going to convert document batch...
2025-11-14 15:45:23,039 - INFO - Processing document 4_2024-08-28
2025-11-14 15:45:23,099 - INFO - Finished converting document 4_2024-08-28 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-08-16' --> 'data\processed_data\BKNG\4_2024-08-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-08-28' --> 'data\processed_data\BKNG\4_2024-08-28.md'


2025-11-14 15:45:23,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,211 - INFO - Going to convert document batch...
2025-11-14 15:45:23,214 - INFO - Processing document 4_2024-11-13
2025-11-14 15:45:23,270 - INFO - Finished converting document 4_2024-11-13 in 0.11 sec.
2025-11-14 15:45:23,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,353 - INFO - Going to convert document batch...
2025-11-14 15:45:23,354 - INFO - Processing document 4_2024-11-15
2025-11-14 15:45:23,404 - INFO - Finished converting document 4_2024-11-15 in 0.09 sec.
2025-11-14 15:45:23,492 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:23,493 - ERROR - Input document 4_2024-11-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\BKNG\4_2024-11-13' --> 'data\processed_data\BKNG\4_2024-11-13.md'
Converted 'data\edgar_documents\BKNG\4_2024-11-15' --> 'data\processed_data\BKNG\4_2024-11-15.md'


2025-11-14 15:45:23,521 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:23,522 - ERROR - Input document 4_2024-11-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:23,524 - INFO - Going to convert document batch...
2025-11-14 15:45:23,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,566 - INFO - Going to convert document batch...
2025-11-14 15:45:23,568 - INFO - Processing document 4_2024-11-25
2025-11-14 15:45:23,619 - INFO - Fin

Error processing data\edgar_documents\BKNG\4_2024-11-18: File format not allowed: data\edgar_documents\BKNG\4_2024-11-18
Error processing data\edgar_documents\BKNG\4_2024-11-19: File format not allowed: data\edgar_documents\BKNG\4_2024-11-19
Converted 'data\edgar_documents\BKNG\4_2024-11-25' --> 'data\processed_data\BKNG\4_2024-11-25.md'


2025-11-14 15:45:23,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,714 - INFO - Going to convert document batch...
2025-11-14 15:45:23,716 - INFO - Processing document 4_2025-02-25
2025-11-14 15:45:23,787 - INFO - Finished converting document 4_2025-02-25 in 0.11 sec.
2025-11-14 15:45:23,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,890 - INFO - Going to convert document batch...
2025-11-14 15:45:23,891 - INFO - Processing document 4_2025-03-04
2025-11-14 15:45:23,984 - INFO - Finished converting document 4_2025-03-04 in 0.14 sec.


Converted 'data\edgar_documents\BKNG\4_2025-02-25' --> 'data\processed_data\BKNG\4_2025-02-25.md'
Converted 'data\edgar_documents\BKNG\4_2025-03-04' --> 'data\processed_data\BKNG\4_2025-03-04.md'


2025-11-14 15:45:24,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,122 - INFO - Going to convert document batch...
2025-11-14 15:45:24,124 - INFO - Processing document 4_2025-03-06
2025-11-14 15:45:24,180 - INFO - Finished converting document 4_2025-03-06 in 0.12 sec.
2025-11-14 15:45:24,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,250 - INFO - Going to convert document batch...
2025-11-14 15:45:24,252 - INFO - Processing document 4_2025-05-05
2025-11-14 15:45:24,286 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 15:45:24,380 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:24,381 - ERROR - Input document 4_2025-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\BKNG\4_2025-03-06' --> 'data\processed_data\BKNG\4_2025-03-06.md'
Converted 'data\edgar_documents\BKNG\4_2025-05-05' --> 'data\processed_data\BKNG\4_2025-05-05.md'
Error processing data\edgar_documents\BKNG\4_2025-05-06: File format not allowed: data\edgar_documents\BKNG\4_2025-05-06


2025-11-14 15:45:24,418 - ERROR - Input document 4_2025-05-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:24,421 - INFO - Going to convert document batch...
2025-11-14 15:45:24,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,485 - INFO - Going to convert document batch...
2025-11-14 15:45:24,487 - INFO - Processing document 4_2025-05-13
2025-11-14 15:45:24,550 - INFO - Finished converting document 4_2025-05-13 in 0.12 sec.
2025-11-14 15:45:24,619 - INFO - detec

Error processing data\edgar_documents\BKNG\4_2025-05-07: File format not allowed: data\edgar_documents\BKNG\4_2025-05-07
Converted 'data\edgar_documents\BKNG\4_2025-05-13' --> 'data\processed_data\BKNG\4_2025-05-13.md'


2025-11-14 15:45:24,688 - INFO - Going to convert document batch...
2025-11-14 15:45:24,691 - INFO - Processing document 4_2025-05-16
2025-11-14 15:45:24,893 - INFO - Finished converting document 4_2025-05-16 in 0.30 sec.
2025-11-14 15:45:25,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:25,107 - INFO - Going to convert document batch...
2025-11-14 15:45:25,109 - INFO - Processing document 4_2025-06-02
2025-11-14 15:45:25,171 - INFO - Finished converting document 4_2025-06-02 in 0.12 sec.
2025-11-14 15:45:25,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-05-16' --> 'data\processed_data\BKNG\4_2025-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2025-06-02' --> 'data\processed_data\BKNG\4_2025-06-02.md'


2025-11-14 15:45:25,283 - INFO - Going to convert document batch...
2025-11-14 15:45:25,284 - INFO - Processing document 4_2025-06-17
2025-11-14 15:45:25,385 - INFO - Finished converting document 4_2025-06-17 in 0.17 sec.
2025-11-14 15:45:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-06-17' --> 'data\processed_data\BKNG\4_2025-06-17.md'


2025-11-14 15:45:26,301 - INFO - Going to convert document batch...
2025-11-14 15:45:26,303 - INFO - Processing document 4_2025-07-16
2025-11-14 15:45:26,392 - INFO - Finished converting document 4_2025-07-16 in 0.91 sec.
2025-11-14 15:45:26,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:26,534 - INFO - Going to convert document batch...
2025-11-14 15:45:26,536 - INFO - Processing document 4_2025-08-01
2025-11-14 15:45:26,601 - INFO - Finished converting document 4_2025-08-01 in 0.12 sec.
2025-11-14 15:45:26,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-07-16' --> 'data\processed_data\BKNG\4_2025-07-16.md'
Converted 'data\edgar_documents\BKNG\4_2025-08-01' --> 'data\processed_data\BKNG\4_2025-08-01.md'


2025-11-14 15:45:26,722 - INFO - Going to convert document batch...
2025-11-14 15:45:26,724 - INFO - Processing document 4_2025-08-18
2025-11-14 15:45:26,843 - INFO - Finished converting document 4_2025-08-18 in 0.20 sec.
2025-11-14 15:45:26,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,021 - INFO - Going to convert document batch...
2025-11-14 15:45:27,022 - INFO - Processing document 4_2025-09-09


Converted 'data\edgar_documents\BKNG\4_2025-08-18' --> 'data\processed_data\BKNG\4_2025-08-18.md'


2025-11-14 15:45:27,180 - INFO - Finished converting document 4_2025-09-09 in 0.27 sec.
2025-11-14 15:45:27,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,390 - INFO - Going to convert document batch...
2025-11-14 15:45:27,393 - INFO - Processing document 4_2025-09-16


Converted 'data\edgar_documents\BKNG\4_2025-09-09' --> 'data\processed_data\BKNG\4_2025-09-09.md'


2025-11-14 15:45:27,590 - INFO - Finished converting document 4_2025-09-16 in 0.30 sec.
2025-11-14 15:45:27,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,805 - INFO - Going to convert document batch...
2025-11-14 15:45:27,809 - INFO - Processing document 4_2025-10-16


Converted 'data\edgar_documents\BKNG\4_2025-09-16' --> 'data\processed_data\BKNG\4_2025-09-16.md'


2025-11-14 15:45:27,923 - INFO - Finished converting document 4_2025-10-16 in 0.20 sec.
2025-11-14 15:45:28,065 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:28,067 - ERROR - Input document 4_2025-11-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:28,070 - INFO - Going to convert document batch...
2025-11-14 15:45:28,113 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:28,115 - ERROR - Input document 4_2025-11-05 with forma

Converted 'data\edgar_documents\BKNG\4_2025-10-16' --> 'data\processed_data\BKNG\4_2025-10-16.md'
Error processing data\edgar_documents\BKNG\4_2025-11-04: File format not allowed: data\edgar_documents\BKNG\4_2025-11-04
Error processing data\edgar_documents\BKNG\4_2025-11-05: File format not allowed: data\edgar_documents\BKNG\4_2025-11-05


2025-11-14 15:45:28,240 - INFO - Finished converting document 4_2025-11-10 in 0.11 sec.
2025-11-14 15:45:28,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,346 - INFO - Going to convert document batch...
2025-11-14 15:45:28,348 - INFO - Processing document 8-K_2023-01-13
2025-11-14 15:45:28,392 - INFO - Finished converting document 8-K_2023-01-13 in 0.11 sec.
2025-11-14 15:45:28,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-11-10' --> 'data\processed_data\BKNG\4_2025-11-10.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-01-13' --> 'data\processed_data\BKNG\8-K_2023-01-13.md'


2025-11-14 15:45:28,545 - INFO - Going to convert document batch...
2025-11-14 15:45:28,547 - INFO - Processing document 8-K_2023-02-23
2025-11-14 15:45:28,598 - INFO - Finished converting document 8-K_2023-02-23 in 0.17 sec.
2025-11-14 15:45:28,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,716 - INFO - Going to convert document batch...
2025-11-14 15:45:28,719 - INFO - Processing document 8-K_2023-04-11
2025-11-14 15:45:28,803 - INFO - Finished converting document 8-K_2023-04-11 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-02-23' --> 'data\processed_data\BKNG\8-K_2023-02-23.md'


2025-11-14 15:45:28,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,945 - INFO - Going to convert document batch...
2025-11-14 15:45:28,946 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:45:29,005 - INFO - Finished converting document 8-K_2023-04-24 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-04-11' --> 'data\processed_data\BKNG\8-K_2023-04-11.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-04-24' --> 'data\processed_data\BKNG\8-K_2023-04-24.md'


2025-11-14 15:45:29,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,103 - INFO - Going to convert document batch...
2025-11-14 15:45:29,104 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:45:29,146 - INFO - Finished converting document 8-K_2023-05-04 in 0.11 sec.
2025-11-14 15:45:29,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,260 - INFO - Going to convert document batch...
2025-11-14 15:45:29,263 - INFO - Processing document 8-K_2023-05-12


Converted 'data\edgar_documents\BKNG\8-K_2023-05-04' --> 'data\processed_data\BKNG\8-K_2023-05-04.md'


2025-11-14 15:45:29,402 - INFO - Finished converting document 8-K_2023-05-12 in 0.23 sec.
2025-11-14 15:45:29,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,578 - INFO - Going to convert document batch...
2025-11-14 15:45:29,579 - INFO - Processing document 8-K_2023-05-19
2025-11-14 15:45:29,643 - INFO - Finished converting document 8-K_2023-05-19 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-05-12' --> 'data\processed_data\BKNG\8-K_2023-05-12.md'


2025-11-14 15:45:29,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,783 - INFO - Going to convert document batch...
2025-11-14 15:45:29,785 - INFO - Processing document 8-K_2023-06-07
2025-11-14 15:45:29,853 - INFO - Finished converting document 8-K_2023-06-07 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-05-19' --> 'data\processed_data\BKNG\8-K_2023-05-19.md'


2025-11-14 15:45:29,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,014 - INFO - Going to convert document batch...
2025-11-14 15:45:30,016 - INFO - Processing document 8-K_2023-07-05
2025-11-14 15:45:30,061 - INFO - Finished converting document 8-K_2023-07-05 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-06-07' --> 'data\processed_data\BKNG\8-K_2023-06-07.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-07-05' --> 'data\processed_data\BKNG\8-K_2023-07-05.md'


2025-11-14 15:45:30,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,187 - INFO - Going to convert document batch...
2025-11-14 15:45:30,188 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:45:30,246 - INFO - Finished converting document 8-K_2023-08-03 in 0.17 sec.
2025-11-14 15:45:30,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,371 - INFO - Going to convert document batch...
2025-11-14 15:45:30,381 - INFO - Processing document 8-K_2023-09-25
2025-11-14 15:45:30,467 - INFO - Finished converting document 8-K_2023-09-25 in 0.20 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-08-03' --> 'data\processed_data\BKNG\8-K_2023-08-03.md'


2025-11-14 15:45:30,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,646 - INFO - Going to convert document batch...
2025-11-14 15:45:30,648 - INFO - Processing document 8-K_2023-10-24
2025-11-14 15:45:30,719 - INFO - Finished converting document 8-K_2023-10-24 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-09-25' --> 'data\processed_data\BKNG\8-K_2023-09-25.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-10-24' --> 'data\processed_data\BKNG\8-K_2023-10-24.md'


2025-11-14 15:45:30,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,877 - INFO - Going to convert document batch...
2025-11-14 15:45:30,879 - INFO - Processing document 8-K_2023-11-02
2025-11-14 15:45:30,948 - INFO - Finished converting document 8-K_2023-11-02 in 0.20 sec.
2025-11-14 15:45:31,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,110 - INFO - Going to convert document batch...
2025-11-14 15:45:31,112 - INFO - Processing document 8-K_2023-12-13
2025-11-14 15:45:31,195 - INFO - Finished converting document 8-K_2023-12-13 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-11-02' --> 'data\processed_data\BKNG\8-K_2023-11-02.md'


2025-11-14 15:45:31,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,326 - INFO - Going to convert document batch...
2025-11-14 15:45:31,328 - INFO - Processing document 8-K_2024-01-19
2025-11-14 15:45:31,402 - INFO - Finished converting document 8-K_2024-01-19 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-12-13' --> 'data\processed_data\BKNG\8-K_2023-12-13.md'


2025-11-14 15:45:31,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,533 - INFO - Going to convert document batch...
2025-11-14 15:45:31,534 - INFO - Processing document 8-K_2024-02-22
2025-11-14 15:45:31,605 - INFO - Finished converting document 8-K_2024-02-22 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-01-19' --> 'data\processed_data\BKNG\8-K_2024-01-19.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-02-22' --> 'data\processed_data\BKNG\8-K_2024-02-22.md'


2025-11-14 15:45:31,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,710 - INFO - Going to convert document batch...
2025-11-14 15:45:31,712 - INFO - Processing document 8-K_2024-03-01
2025-11-14 15:45:31,884 - INFO - Finished converting document 8-K_2024-03-01 in 0.25 sec.
2025-11-14 15:45:32,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,097 - INFO - Going to convert document batch...
2025-11-14 15:45:32,099 - INFO - Processing document 8-K_2024-04-05


Converted 'data\edgar_documents\BKNG\8-K_2024-03-01' --> 'data\processed_data\BKNG\8-K_2024-03-01.md'


2025-11-14 15:45:32,201 - INFO - Finished converting document 8-K_2024-04-05 in 0.23 sec.
2025-11-14 15:45:32,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,322 - INFO - Going to convert document batch...
2025-11-14 15:45:32,324 - INFO - Processing document 8-K_2024-04-22
2025-11-14 15:45:32,406 - INFO - Finished converting document 8-K_2024-04-22 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-04-05' --> 'data\processed_data\BKNG\8-K_2024-04-05.md'


2025-11-14 15:45:32,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,586 - INFO - Going to convert document batch...
2025-11-14 15:45:32,588 - INFO - Processing document 8-K_2024-05-02


Converted 'data\edgar_documents\BKNG\8-K_2024-04-22' --> 'data\processed_data\BKNG\8-K_2024-04-22.md'


2025-11-14 15:45:32,667 - INFO - Finished converting document 8-K_2024-05-02 in 0.20 sec.
2025-11-14 15:45:32,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,752 - INFO - Going to convert document batch...
2025-11-14 15:45:32,753 - INFO - Processing document 8-K_2024-05-10
2025-11-14 15:45:32,807 - INFO - Finished converting document 8-K_2024-05-10 in 0.11 sec.
2025-11-14 15:45:32,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2024-05-02' --> 'data\processed_data\BKNG\8-K_2024-05-02.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-05-10' --> 'data\processed_data\BKNG\8-K_2024-05-10.md'


2025-11-14 15:45:32,917 - INFO - Going to convert document batch...
2025-11-14 15:45:32,918 - INFO - Processing document 8-K_2024-06-05
2025-11-14 15:45:33,040 - INFO - Finished converting document 8-K_2024-06-05 in 0.20 sec.
2025-11-14 15:45:33,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:33,147 - INFO - Going to convert document batch...
2025-11-14 15:45:33,149 - INFO - Processing document 8-K_2024-08-01
2025-11-14 15:45:33,217 - INFO - Finished converting document 8-K_2024-08-01 in 0.14 sec.
2025-11-14 15:45:33,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2024-06-05' --> 'data\processed_data\BKNG\8-K_2024-06-05.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-08-01' --> 'data\processed_data\BKNG\8-K_2024-08-01.md'


2025-11-14 15:45:33,335 - INFO - Going to convert document batch...
2025-11-14 15:45:33,337 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:45:33,408 - INFO - Finished converting document 8-K_2024-10-30 in 0.16 sec.
2025-11-14 15:45:33,477 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:33,479 - ERROR - Input document 8-K_2024-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:33,481 - INFO - Going to convert docu

Converted 'data\edgar_documents\BKNG\8-K_2024-10-30' --> 'data\processed_data\BKNG\8-K_2024-10-30.md'
Error processing data\edgar_documents\BKNG\8-K_2024-11-08: File format not allowed: data\edgar_documents\BKNG\8-K_2024-11-08


2025-11-14 15:45:33,693 - INFO - Finished converting document 8-K_2024-11-21 in 0.20 sec.
2025-11-14 15:45:33,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:33,850 - INFO - Going to convert document batch...
2025-11-14 15:45:33,851 - INFO - Processing document 8-K_2024-12-10


Converted 'data\edgar_documents\BKNG\8-K_2024-11-21' --> 'data\processed_data\BKNG\8-K_2024-11-21.md'


2025-11-14 15:45:34,652 - INFO - Finished converting document 8-K_2024-12-10 in 0.88 sec.
2025-11-14 15:45:34,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:34,785 - INFO - Going to convert document batch...
2025-11-14 15:45:34,787 - INFO - Processing document 8-K_2024-12-18
2025-11-14 15:45:34,882 - INFO - Finished converting document 8-K_2024-12-18 in 0.19 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-12-10' --> 'data\processed_data\BKNG\8-K_2024-12-10.md'


2025-11-14 15:45:34,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,014 - INFO - Going to convert document batch...
2025-11-14 15:45:35,016 - INFO - Processing document 8-K_2025-02-20
2025-11-14 15:45:35,068 - INFO - Finished converting document 8-K_2025-02-20 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-12-18' --> 'data\processed_data\BKNG\8-K_2024-12-18.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-02-20' --> 'data\processed_data\BKNG\8-K_2025-02-20.md'


2025-11-14 15:45:35,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,204 - INFO - Going to convert document batch...
2025-11-14 15:45:35,207 - INFO - Processing document 8-K_2025-04-22
2025-11-14 15:45:35,261 - INFO - Finished converting document 8-K_2025-04-22 in 0.17 sec.
2025-11-14 15:45:35,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,419 - INFO - Going to convert document batch...
2025-11-14 15:45:35,423 - INFO - Processing document 8-K_2025-04-29


Converted 'data\edgar_documents\BKNG\8-K_2025-04-22' --> 'data\processed_data\BKNG\8-K_2025-04-22.md'


2025-11-14 15:45:35,520 - INFO - Finished converting document 8-K_2025-04-29 in 0.22 sec.
2025-11-14 15:45:35,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,660 - INFO - Going to convert document batch...
2025-11-14 15:45:35,662 - INFO - Processing document 8-K_2025-05-09


Converted 'data\edgar_documents\BKNG\8-K_2025-04-29' --> 'data\processed_data\BKNG\8-K_2025-04-29.md'


2025-11-14 15:45:35,838 - INFO - Finished converting document 8-K_2025-05-09 in 0.28 sec.
2025-11-14 15:45:35,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,064 - INFO - Going to convert document batch...
2025-11-14 15:45:36,065 - INFO - Processing document 8-K_2025-06-04


Converted 'data\edgar_documents\BKNG\8-K_2025-05-09' --> 'data\processed_data\BKNG\8-K_2025-05-09.md'


2025-11-14 15:45:36,161 - INFO - Finished converting document 8-K_2025-06-04 in 0.22 sec.
2025-11-14 15:45:36,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,287 - INFO - Going to convert document batch...
2025-11-14 15:45:36,290 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:45:36,377 - INFO - Finished converting document 8-K_2025-07-29 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2025-06-04' --> 'data\processed_data\BKNG\8-K_2025-06-04.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-07-29' --> 'data\processed_data\BKNG\8-K_2025-07-29.md'


2025-11-14 15:45:36,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,577 - INFO - Going to convert document batch...
2025-11-14 15:45:36,581 - INFO - Processing document 8-K_2025-09-19
2025-11-14 15:45:36,687 - INFO - Finished converting document 8-K_2025-09-19 in 0.27 sec.
2025-11-14 15:45:36,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,753 - INFO - Going to convert document batch...
2025-11-14 15:45:36,754 - INFO - Processing document 8-K_2025-10-17
2025-11-14 15:45:36,802 - INFO - Finished converting document 8-K_2025-10-17 in 0.09 sec.
2025-11-14 15:45:36,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2025-09-19' --> 'data\processed_data\BKNG\8-K_2025-09-19.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-10-17' --> 'data\processed_data\BKNG\8-K_2025-10-17.md'


2025-11-14 15:45:36,954 - INFO - Going to convert document batch...
2025-11-14 15:45:36,957 - INFO - Processing document 8-K_2025-10-28
2025-11-14 15:45:37,027 - INFO - Finished converting document 8-K_2025-10-28 in 0.19 sec.
2025-11-14 15:45:37,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:37,145 - INFO - Going to convert document batch...
2025-11-14 15:45:37,146 - INFO - Processing document 8-K_2025-11-07
2025-11-14 15:45:37,243 - INFO - Finished converting document 8-K_2025-11-07 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2025-10-28' --> 'data\processed_data\BKNG\8-K_2025-10-28.md'


2025-11-14 15:45:37,339 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:37,341 - ERROR - Input document DEF-14A_2023-04-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:37,343 - INFO - Going to convert document batch...
2025-11-14 15:45:37,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2025-11-07' --> 'data\processed_data\BKNG\8-K_2025-11-07.md'
Error processing data\edgar_documents\BKNG\DEF-14A_2023-04-24: File format not allowed: data\edgar_documents\BKNG\DEF-14A_2023-04-24


2025-11-14 15:45:38,549 - INFO - Going to convert document batch...
2025-11-14 15:45:38,551 - INFO - Processing document DEF-14A_2024-04-23
2025-11-14 15:45:42,365 - INFO - Finished converting document DEF-14A_2024-04-23 in 5.01 sec.
2025-11-14 15:45:45,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\DEF-14A_2024-04-23' --> 'data\processed_data\BKNG\DEF-14A_2024-04-23.md'


2025-11-14 15:45:47,097 - INFO - Going to convert document batch...
2025-11-14 15:45:47,099 - INFO - Processing document DEF-14A_2025-04-22
2025-11-14 15:45:50,375 - INFO - Finished converting document DEF-14A_2025-04-22 in 5.31 sec.


Converted 'data\edgar_documents\BKNG\DEF-14A_2025-04-22' --> 'data\processed_data\BKNG\DEF-14A_2025-04-22.md'
Processed 112 new files. Errors: 12
Found 62 files to process in data\edgar_documents\BLK


2025-11-14 15:45:53,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:46:00,127 - INFO - Going to convert document batch...
2025-11-14 15:46:00,128 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:46:00,129 - INFO - Processing document 10-K_2025-02-25
2025-11-14 15:46:13,892 - INFO - Finished converting document 10-K_2025-02-25 in 21.06 sec.


Converted 'data\edgar_documents\BLK\10-K_2025-02-25' --> 'data\processed_data\BLK\10-K_2025-02-25.md'


2025-11-14 15:46:15,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:46:21,651 - INFO - Going to convert document batch...
2025-11-14 15:46:21,652 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 15:46:28,105 - INFO - Finished converting document 10-Q_2024-11-06 in 12.36 sec.
2025-11-14 15:46:29,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\10-Q_2024-11-06' --> 'data\processed_data\BLK\10-Q_2024-11-06.md'


2025-11-14 15:46:35,057 - INFO - Going to convert document batch...
2025-11-14 15:46:35,059 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:46:41,117 - INFO - Finished converting document 10-Q_2025-05-07 in 11.73 sec.
2025-11-14 15:46:42,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\10-Q_2025-05-07' --> 'data\processed_data\BLK\10-Q_2025-05-07.md'


2025-11-14 15:46:48,792 - INFO - Going to convert document batch...
2025-11-14 15:46:48,794 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:46:57,183 - INFO - Finished converting document 10-Q_2025-08-06 in 15.25 sec.


Converted 'data\edgar_documents\BLK\10-Q_2025-08-06' --> 'data\processed_data\BLK\10-Q_2025-08-06.md'


2025-11-14 15:46:58,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:06,720 - INFO - Going to convert document batch...
2025-11-14 15:47:06,722 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:47:15,819 - INFO - Finished converting document 10-Q_2025-11-05 in 17.17 sec.
2025-11-14 15:47:17,399 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:47:17,400 - ERROR - Input document 4_2024-03-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-1

Converted 'data\edgar_documents\BLK\10-Q_2025-11-05' --> 'data\processed_data\BLK\10-Q_2025-11-05.md'
Error processing data\edgar_documents\BLK\4_2024-03-05: File format not allowed: data\edgar_documents\BLK\4_2024-03-05
Error processing data\edgar_documents\BLK\4_2024-03-07: File format not allowed: data\edgar_documents\BLK\4_2024-03-07
Error processing data\edgar_documents\BLK\4_2024-07-17: File format not allowed: data\edgar_documents\BLK\4_2024-07-17
Error processing data\edgar_documents\BLK\4_2024-07-19: File format not allowed: data\edgar_documents\BLK\4_2024-07-19


2025-11-14 15:47:17,574 - INFO - Going to convert document batch...
2025-11-14 15:47:17,580 - INFO - Processing document 4_2024-10-02
2025-11-14 15:47:17,627 - INFO - Finished converting document 4_2024-10-02 in 0.11 sec.
2025-11-14 15:47:17,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:17,762 - INFO - Going to convert document batch...
2025-11-14 15:47:17,765 - INFO - Processing document 4_2024-12-06
2025-11-14 15:47:17,879 - INFO - Finished converting document 4_2024-12-06 in 0.17 sec.


Converted 'data\edgar_documents\BLK\4_2024-10-02' --> 'data\processed_data\BLK\4_2024-10-02.md'


2025-11-14 15:47:17,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,007 - INFO - Going to convert document batch...
2025-11-14 15:47:18,010 - INFO - Processing document 4_2025-01-03
2025-11-14 15:47:18,061 - INFO - Finished converting document 4_2025-01-03 in 0.09 sec.
2025-11-14 15:47:18,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2024-12-06' --> 'data\processed_data\BLK\4_2024-12-06.md'
Converted 'data\edgar_documents\BLK\4_2025-01-03' --> 'data\processed_data\BLK\4_2025-01-03.md'


2025-11-14 15:47:18,172 - INFO - Going to convert document batch...
2025-11-14 15:47:18,175 - INFO - Processing document 4_2025-01-17
2025-11-14 15:47:18,235 - INFO - Finished converting document 4_2025-01-17 in 0.11 sec.
2025-11-14 15:47:18,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,331 - INFO - Going to convert document batch...
2025-11-14 15:47:18,332 - INFO - Processing document 4_2025-01-23
2025-11-14 15:47:18,385 - INFO - Finished converting document 4_2025-01-23 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-01-17' --> 'data\processed_data\BLK\4_2025-01-17.md'
Converted 'data\edgar_documents\BLK\4_2025-01-23' --> 'data\processed_data\BLK\4_2025-01-23.md'


2025-11-14 15:47:18,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,536 - INFO - Going to convert document batch...
2025-11-14 15:47:18,537 - INFO - Processing document 4_2025-01-31
2025-11-14 15:47:18,606 - INFO - Finished converting document 4_2025-01-31 in 0.14 sec.
2025-11-14 15:47:18,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,742 - INFO - Going to convert document batch...
2025-11-14 15:47:18,743 - INFO - Processing document 4_2025-02-04
2025-11-14 15:47:18,812 - INFO - Finished converting document 4_2025-02-04 in 0.14 sec.


Converted 'data\edgar_documents\BLK\4_2025-01-31' --> 'data\processed_data\BLK\4_2025-01-31.md'


2025-11-14 15:47:18,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,914 - INFO - Going to convert document batch...
2025-11-14 15:47:18,915 - INFO - Processing document 4_2025-02-28
2025-11-14 15:47:18,974 - INFO - Finished converting document 4_2025-02-28 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-02-04' --> 'data\processed_data\BLK\4_2025-02-04.md'
Converted 'data\edgar_documents\BLK\4_2025-02-28' --> 'data\processed_data\BLK\4_2025-02-28.md'


2025-11-14 15:47:19,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,088 - INFO - Going to convert document batch...
2025-11-14 15:47:19,090 - INFO - Processing document 4_2025-03-04
2025-11-14 15:47:19,143 - INFO - Finished converting document 4_2025-03-04 in 0.11 sec.
2025-11-14 15:47:19,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,245 - INFO - Going to convert document batch...
2025-11-14 15:47:19,246 - INFO - Processing document 4_2025-03-06
2025-11-14 15:47:19,298 - INFO - Finished converting document 4_2025-03-06 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-04' --> 'data\processed_data\BLK\4_2025-03-04.md'
Converted 'data\edgar_documents\BLK\4_2025-03-06' --> 'data\processed_data\BLK\4_2025-03-06.md'


2025-11-14 15:47:19,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,422 - INFO - Going to convert document batch...
2025-11-14 15:47:19,424 - INFO - Processing document 4_2025-03-07
2025-11-14 15:47:19,477 - INFO - Finished converting document 4_2025-03-07 in 0.11 sec.
2025-11-14 15:47:19,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,586 - INFO - Going to convert document batch...
2025-11-14 15:47:19,587 - INFO - Processing document 4_2025-03-10
2025-11-14 15:47:19,650 - INFO - Finished converting document 4_2025-03-10 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-07' --> 'data\processed_data\BLK\4_2025-03-07.md'
Converted 'data\edgar_documents\BLK\4_2025-03-10' --> 'data\processed_data\BLK\4_2025-03-10.md'


2025-11-14 15:47:19,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,778 - INFO - Going to convert document batch...
2025-11-14 15:47:19,780 - INFO - Processing document 4_2025-03-11
2025-11-14 15:47:19,844 - INFO - Finished converting document 4_2025-03-11 in 0.12 sec.
2025-11-14 15:47:19,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,933 - INFO - Going to convert document batch...
2025-11-14 15:47:19,935 - INFO - Processing document 4_2025-03-12
2025-11-14 15:47:19,993 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-11' --> 'data\processed_data\BLK\4_2025-03-11.md'
Converted 'data\edgar_documents\BLK\4_2025-03-12' --> 'data\processed_data\BLK\4_2025-03-12.md'


2025-11-14 15:47:20,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,116 - INFO - Going to convert document batch...
2025-11-14 15:47:20,118 - INFO - Processing document 4_2025-03-13
2025-11-14 15:47:20,163 - INFO - Finished converting document 4_2025-03-13 in 0.09 sec.
2025-11-14 15:47:20,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,272 - INFO - Going to convert document batch...
2025-11-14 15:47:20,275 - INFO - Processing document 4_2025-03-14
2025-11-14 15:47:20,354 - INFO - Finished converting document 4_2025-03-14 in 0.12 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-13' --> 'data\processed_data\BLK\4_2025-03-13.md'
Converted 'data\edgar_documents\BLK\4_2025-03-14' --> 'data\processed_data\BLK\4_2025-03-14.md'


2025-11-14 15:47:20,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,464 - INFO - Going to convert document batch...
2025-11-14 15:47:20,465 - INFO - Processing document 4_2025-03-17
2025-11-14 15:47:20,534 - INFO - Finished converting document 4_2025-03-17 in 0.12 sec.
2025-11-14 15:47:20,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,616 - INFO - Going to convert document batch...
2025-11-14 15:47:20,618 - INFO - Processing document 4_2025-03-18
2025-11-14 15:47:20,674 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-17' --> 'data\processed_data\BLK\4_2025-03-17.md'
Converted 'data\edgar_documents\BLK\4_2025-03-18' --> 'data\processed_data\BLK\4_2025-03-18.md'


2025-11-14 15:47:20,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,802 - INFO - Going to convert document batch...
2025-11-14 15:47:20,804 - INFO - Processing document 4_2025-03-19
2025-11-14 15:47:20,840 - INFO - Finished converting document 4_2025-03-19 in 0.11 sec.
2025-11-14 15:47:20,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,924 - INFO - Going to convert document batch...
2025-11-14 15:47:20,927 - INFO - Processing document 4_2025-03-20
2025-11-14 15:47:20,964 - INFO - Finished converting document 4_2025-03-20 in 0.09 sec.
2025-11-14 15:47:21,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-03-19' --> 'data\processed_data\BLK\4_2025-03-19.md'
Converted 'data\edgar_documents\BLK\4_2025-03-20' --> 'data\processed_data\BLK\4_2025-03-20.md'


2025-11-14 15:47:21,070 - INFO - Going to convert document batch...
2025-11-14 15:47:21,074 - INFO - Processing document 4_2025-03-21
2025-11-14 15:47:21,189 - INFO - Finished converting document 4_2025-03-21 in 0.19 sec.
2025-11-14 15:47:21,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,317 - INFO - Going to convert document batch...
2025-11-14 15:47:21,319 - INFO - Processing document 4_2025-03-24
2025-11-14 15:47:21,389 - INFO - Finished converting document 4_2025-03-24 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-21' --> 'data\processed_data\BLK\4_2025-03-21.md'
Converted 'data\edgar_documents\BLK\4_2025-03-24' --> 'data\processed_data\BLK\4_2025-03-24.md'


2025-11-14 15:47:21,478 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:47:21,480 - ERROR - Input document 4_2025-03-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:47:21,483 - INFO - Going to convert document batch...
2025-11-14 15:47:21,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,532 - INFO - Going to convert document batch...
2025-11-14 15:47:21,533 - INFO - Processing document 4_2025-04-02
2025-11-14 15:47:21,576 - INFO - Fin

Error processing data\edgar_documents\BLK\4_2025-03-27: File format not allowed: data\edgar_documents\BLK\4_2025-03-27
Converted 'data\edgar_documents\BLK\4_2025-04-02' --> 'data\processed_data\BLK\4_2025-04-02.md'


2025-11-14 15:47:21,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,832 - INFO - Going to convert document batch...
2025-11-14 15:47:21,837 - INFO - Processing document 4_2025-04-23
2025-11-14 15:47:21,913 - INFO - Finished converting document 4_2025-04-23 in 0.12 sec.


Converted 'data\edgar_documents\BLK\4_2025-04-17' --> 'data\processed_data\BLK\4_2025-04-17.md'
Converted 'data\edgar_documents\BLK\4_2025-04-23' --> 'data\processed_data\BLK\4_2025-04-23.md'


2025-11-14 15:47:22,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,049 - INFO - Going to convert document batch...
2025-11-14 15:47:22,050 - INFO - Processing document 4_2025-04-28
2025-11-14 15:47:22,125 - INFO - Finished converting document 4_2025-04-28 in 0.14 sec.
2025-11-14 15:47:22,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,267 - INFO - Going to convert document batch...
2025-11-14 15:47:22,269 - INFO - Processing document 4_2025-05-01
2025-11-14 15:47:22,362 - INFO - Finished converting document 4_2025-05-01 in 0.17 sec.


Converted 'data\edgar_documents\BLK\4_2025-04-28' --> 'data\processed_data\BLK\4_2025-04-28.md'


2025-11-14 15:47:22,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,493 - INFO - Going to convert document batch...
2025-11-14 15:47:22,495 - INFO - Processing document 4_2025-05-21
2025-11-14 15:47:22,547 - INFO - Finished converting document 4_2025-05-21 in 0.09 sec.
2025-11-14 15:47:22,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-05-01' --> 'data\processed_data\BLK\4_2025-05-01.md'
Converted 'data\edgar_documents\BLK\4_2025-05-21' --> 'data\processed_data\BLK\4_2025-05-21.md'


2025-11-14 15:47:22,670 - INFO - Going to convert document batch...
2025-11-14 15:47:22,673 - INFO - Processing document 4_2025-05-28
2025-11-14 15:47:22,780 - INFO - Finished converting document 4_2025-05-28 in 0.19 sec.
2025-11-14 15:47:22,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,869 - INFO - Going to convert document batch...
2025-11-14 15:47:22,871 - INFO - Processing document 4_2025-07-02
2025-11-14 15:47:22,931 - INFO - Finished converting document 4_2025-07-02 in 0.09 sec.
2025-11-14 15:47:23,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-05-28' --> 'data\processed_data\BLK\4_2025-05-28.md'
Converted 'data\edgar_documents\BLK\4_2025-07-02' --> 'data\processed_data\BLK\4_2025-07-02.md'


2025-11-14 15:47:23,040 - INFO - Going to convert document batch...
2025-11-14 15:47:23,041 - INFO - Processing document 4_2025-07-18
2025-11-14 15:47:23,085 - INFO - Finished converting document 4_2025-07-18 in 0.09 sec.
2025-11-14 15:47:23,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,170 - INFO - Going to convert document batch...
2025-11-14 15:47:23,172 - INFO - Processing document 4_2025-07-25
2025-11-14 15:47:23,230 - INFO - Finished converting document 4_2025-07-25 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-07-18' --> 'data\processed_data\BLK\4_2025-07-18.md'
Converted 'data\edgar_documents\BLK\4_2025-07-25' --> 'data\processed_data\BLK\4_2025-07-25.md'


2025-11-14 15:47:23,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,348 - INFO - Going to convert document batch...
2025-11-14 15:47:23,349 - INFO - Processing document 4_2025-08-01
2025-11-14 15:47:23,408 - INFO - Finished converting document 4_2025-08-01 in 0.12 sec.
2025-11-14 15:47:23,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,494 - INFO - Going to convert document batch...
2025-11-14 15:47:23,495 - INFO - Processing document 4_2025-10-02
2025-11-14 15:47:23,552 - INFO - Finished converting document 4_2025-10-02 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-08-01' --> 'data\processed_data\BLK\4_2025-08-01.md'
Converted 'data\edgar_documents\BLK\4_2025-10-02' --> 'data\processed_data\BLK\4_2025-10-02.md'


2025-11-14 15:47:23,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,676 - INFO - Going to convert document batch...
2025-11-14 15:47:23,677 - INFO - Processing document 4_2025-10-22
2025-11-14 15:47:23,783 - INFO - Finished converting document 4_2025-10-22 in 0.17 sec.
2025-11-14 15:47:23,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,974 - INFO - Going to convert document batch...
2025-11-14 15:47:23,976 - INFO - Processing document 8-K_2024-10-01
2025-11-14 15:47:24,035 - INFO - Finished converting document 8-K_2024-10-01 in 0.16 sec.


Converted 'data\edgar_documents\BLK\4_2025-10-22' --> 'data\processed_data\BLK\4_2025-10-22.md'
Converted 'data\edgar_documents\BLK\8-K_2024-10-01' --> 'data\processed_data\BLK\8-K_2024-10-01.md'


2025-11-14 15:47:24,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,151 - INFO - Going to convert document batch...
2025-11-14 15:47:24,153 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:47:24,192 - INFO - Finished converting document 8-K_2024-10-11 in 0.12 sec.
2025-11-14 15:47:24,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,281 - INFO - Going to convert document batch...
2025-11-14 15:47:24,283 - INFO - Processing document 8-K_2024-11-08
2025-11-14 15:47:24,344 - INFO - Finished converting document 8-K_2024-11-08 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2024-10-11' --> 'data\processed_data\BLK\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BLK\8-K_2024-11-08' --> 'data\processed_data\BLK\8-K_2024-11-08.md'


2025-11-14 15:47:24,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,461 - INFO - Going to convert document batch...
2025-11-14 15:47:24,462 - INFO - Processing document 8-K_2024-11-19
2025-11-14 15:47:24,513 - INFO - Finished converting document 8-K_2024-11-19 in 0.14 sec.
2025-11-14 15:47:24,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,594 - INFO - Going to convert document batch...
2025-11-14 15:47:24,596 - INFO - Processing document 8-K_2024-12-03
2025-11-14 15:47:24,637 - INFO - Finished converting document 8-K_2024-12-03 in 0.09 sec.
2025-11-14 15:47:24,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,698 - INFO - Going to convert document batch...
2025-11-14 15:47:24,699 - INFO - Processing document 8-K_2025-01-15
2025-11-14 15:47:24,744 - INFO - Finished converting document 8-K_2025-01-15 in 0.08 sec.


Converted 'data\edgar_documents\BLK\8-K_2024-11-19' --> 'data\processed_data\BLK\8-K_2024-11-19.md'
Converted 'data\edgar_documents\BLK\8-K_2024-12-03' --> 'data\processed_data\BLK\8-K_2024-12-03.md'


2025-11-14 15:47:24,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,820 - INFO - Going to convert document batch...
2025-11-14 15:47:24,823 - INFO - Processing document 8-K_2025-02-14
2025-11-14 15:47:24,857 - INFO - Finished converting document 8-K_2025-02-14 in 0.09 sec.
2025-11-14 15:47:24,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,928 - INFO - Going to convert document batch...
2025-11-14 15:47:24,929 - INFO - Processing document 8-K_2025-03-03
2025-11-14 15:47:24,956 - INFO - Finished converting document 8-K_2025-03-03 in 0.08 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-01-15' --> 'data\processed_data\BLK\8-K_2025-01-15.md'
Converted 'data\edgar_documents\BLK\8-K_2025-02-14' --> 'data\processed_data\BLK\8-K_2025-02-14.md'


2025-11-14 15:47:25,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,041 - INFO - Going to convert document batch...
2025-11-14 15:47:25,043 - INFO - Processing document 8-K_2025-03-26
2025-11-14 15:47:25,088 - INFO - Finished converting document 8-K_2025-03-26 in 0.11 sec.
2025-11-14 15:47:25,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,164 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BLK\8-K_2025-03-03' --> 'data\processed_data\BLK\8-K_2025-03-03.md'
Converted 'data\edgar_documents\BLK\8-K_2025-03-26' --> 'data\processed_data\BLK\8-K_2025-03-26.md'


2025-11-14 15:47:25,174 - INFO - Processing document 8-K_2025-04-03
2025-11-14 15:47:25,228 - INFO - Finished converting document 8-K_2025-04-03 in 0.11 sec.
2025-11-14 15:47:25,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,299 - INFO - Going to convert document batch...
2025-11-14 15:47:25,301 - INFO - Processing document 8-K_2025-04-07
2025-11-14 15:47:25,344 - INFO - Finished converting document 8-K_2025-04-07 in 0.09 sec.
2025-11-14 15:47:25,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\8-K_2025-04-03' --> 'data\processed_data\BLK\8-K_2025-04-03.md'
Converted 'data\edgar_documents\BLK\8-K_2025-04-07' --> 'data\processed_data\BLK\8-K_2025-04-07.md'


2025-11-14 15:47:25,436 - INFO - Going to convert document batch...
2025-11-14 15:47:25,438 - INFO - Processing document 8-K_2025-04-11
2025-11-14 15:47:25,492 - INFO - Finished converting document 8-K_2025-04-11 in 0.11 sec.
2025-11-14 15:47:25,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,595 - INFO - Going to convert document batch...
2025-11-14 15:47:25,597 - INFO - Processing document 8-K_2025-05-16


Converted 'data\edgar_documents\BLK\8-K_2025-04-11' --> 'data\processed_data\BLK\8-K_2025-04-11.md'


2025-11-14 15:47:25,706 - INFO - Finished converting document 8-K_2025-05-16 in 0.20 sec.
2025-11-14 15:47:25,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,781 - INFO - Going to convert document batch...
2025-11-14 15:47:25,783 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:47:25,823 - INFO - Finished converting document 8-K_2025-07-01 in 0.09 sec.
2025-11-14 15:47:25,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,910 - INFO - Going to convert document batch...
2025-11-14 15:47:25,912 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:47:25,956 - INFO - Finished converting document 8-K_2025-07-15 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-05-16' --> 'data\processed_data\BLK\8-K_2025-05-16.md'
Converted 'data\edgar_documents\BLK\8-K_2025-07-01' --> 'data\processed_data\BLK\8-K_2025-07-01.md'


2025-11-14 15:47:25,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:26,036 - INFO - Going to convert document batch...
2025-11-14 15:47:26,037 - INFO - Processing document 8-K_2025-10-14
2025-11-14 15:47:26,075 - INFO - Finished converting document 8-K_2025-10-14 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-07-15' --> 'data\processed_data\BLK\8-K_2025-07-15.md'
Converted 'data\edgar_documents\BLK\8-K_2025-10-14' --> 'data\processed_data\BLK\8-K_2025-10-14.md'


2025-11-14 15:47:26,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:30,227 - INFO - Going to convert document batch...
2025-11-14 15:47:30,228 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 15:47:42,547 - INFO - Finished converting document DEF-14A_2025-04-04 in 16.45 sec.


Converted 'data\edgar_documents\BLK\DEF-14A_2025-04-04' --> 'data\processed_data\BLK\DEF-14A_2025-04-04.md'
Processed 57 new files. Errors: 5
Found 107 files to process in data\edgar_documents\BMY


2025-11-14 15:47:46,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:48,848 - INFO - Going to convert document batch...
2025-11-14 15:47:48,849 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:47:48,850 - INFO - Processing document 10-K_2023-02-14
2025-11-14 15:47:55,371 - INFO - Finished converting document 10-K_2023-02-14 in 9.31 sec.
2025-11-14 15:47:56,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2023-02-14' --> 'data\processed_data\BMY\10-K_2023-02-14.md'


2025-11-14 15:47:57,335 - INFO - Going to convert document batch...
2025-11-14 15:47:57,336 - INFO - Processing document 10-K_2024-02-13
2025-11-14 15:48:00,920 - INFO - Finished converting document 10-K_2024-02-13 in 4.75 sec.
2025-11-14 15:48:01,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2024-02-13' --> 'data\processed_data\BMY\10-K_2024-02-13.md'


2025-11-14 15:48:02,671 - INFO - Going to convert document batch...
2025-11-14 15:48:02,672 - INFO - Processing document 10-K_2025-02-12
2025-11-14 15:48:06,267 - INFO - Finished converting document 10-K_2025-02-12 in 4.48 sec.
2025-11-14 15:48:07,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2025-02-12' --> 'data\processed_data\BMY\10-K_2025-02-12.md'


2025-11-14 15:48:07,620 - INFO - Going to convert document batch...
2025-11-14 15:48:07,621 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 15:48:08,621 - INFO - Finished converting document 10-Q_2023-04-27 in 1.47 sec.
2025-11-14 15:48:09,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-04-27' --> 'data\processed_data\BMY\10-Q_2023-04-27.md'


2025-11-14 15:48:10,357 - INFO - Going to convert document batch...
2025-11-14 15:48:10,358 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:48:11,465 - INFO - Finished converting document 10-Q_2023-07-27 in 2.42 sec.
2025-11-14 15:48:12,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-07-27' --> 'data\processed_data\BMY\10-Q_2023-07-27.md'


2025-11-14 15:48:12,898 - INFO - Going to convert document batch...
2025-11-14 15:48:12,900 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:48:14,115 - INFO - Finished converting document 10-Q_2023-10-26 in 2.12 sec.
2025-11-14 15:48:14,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-10-26' --> 'data\processed_data\BMY\10-Q_2023-10-26.md'


2025-11-14 15:48:15,163 - INFO - Going to convert document batch...
2025-11-14 15:48:15,164 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 15:48:16,127 - INFO - Finished converting document 10-Q_2024-04-25 in 1.47 sec.
2025-11-14 15:48:16,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-04-25' --> 'data\processed_data\BMY\10-Q_2024-04-25.md'


2025-11-14 15:48:17,591 - INFO - Going to convert document batch...
2025-11-14 15:48:17,592 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:48:18,796 - INFO - Finished converting document 10-Q_2024-07-26 in 2.20 sec.
2025-11-14 15:48:19,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-07-26' --> 'data\processed_data\BMY\10-Q_2024-07-26.md'


2025-11-14 15:48:20,286 - INFO - Going to convert document batch...
2025-11-14 15:48:20,287 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:48:21,580 - INFO - Finished converting document 10-Q_2024-10-31 in 2.25 sec.
2025-11-14 15:48:22,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-10-31' --> 'data\processed_data\BMY\10-Q_2024-10-31.md'


2025-11-14 15:48:23,440 - INFO - Going to convert document batch...
2025-11-14 15:48:23,441 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 15:48:24,889 - INFO - Finished converting document 10-Q_2025-04-24 in 2.52 sec.
2025-11-14 15:48:25,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2025-04-24' --> 'data\processed_data\BMY\10-Q_2025-04-24.md'


2025-11-14 15:48:26,146 - INFO - Going to convert document batch...
2025-11-14 15:48:26,148 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 15:48:27,981 - INFO - Finished converting document 10-Q_2025-07-31 in 2.48 sec.
2025-11-14 15:48:28,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2025-07-31' --> 'data\processed_data\BMY\10-Q_2025-07-31.md'


2025-11-14 15:48:29,320 - INFO - Going to convert document batch...
2025-11-14 15:48:29,321 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 15:48:30,561 - INFO - Finished converting document 10-Q_2025-10-30 in 1.92 sec.
2025-11-14 15:48:31,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,534 - INFO - Going to convert document batch...
2025-11-14 15:48:31,535 - INFO - Processing document 4_2023-01-04
2025-11-14 15:48:31,554 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:48:31,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,636 - INFO - Going to convert document batch...
2025-11-14 15:48:31,637 - INFO - Processing document 4_2023-02-03
2025-11-14 15:48:31,661 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.


Converted 'data\edgar_documents\BMY\10-Q_2025-10-30' --> 'data\processed_data\BMY\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\BMY\4_2023-01-04' --> 'data\processed_data\BMY\4_2023-01-04.md'
Converted 'data\edgar_documents\BMY\4_2023-02-03' --> 'data\processed_data\BMY\4_2023-02-03.md'


2025-11-14 15:48:31,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,721 - INFO - Going to convert document batch...
2025-11-14 15:48:31,725 - INFO - Processing document 4_2023-02-08
2025-11-14 15:48:31,762 - INFO - Finished converting document 4_2023-02-08 in 0.08 sec.
2025-11-14 15:48:31,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,814 - INFO - Going to convert document batch...
2025-11-14 15:48:31,815 - INFO - Processing document 4_2023-03-14
2025-11-14 15:48:31,855 - INFO - Finished converting document 4_2023-03-14 in 0.08 sec.
2025-11-14 15:48:31,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,923 - INFO - Going to convert document batch...
2025-11-14 15:48:31,924 - INFO - Processing document 4_2023-04-04
2025-11-14 15:48:31,943 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2023-02-08' --> 'data\processed_data\BMY\4_2023-02-08.md'
Converted 'data\edgar_documents\BMY\4_2023-03-14' --> 'data\processed_data\BMY\4_2023-03-14.md'
Converted 'data\edgar_documents\BMY\4_2023-04-04' --> 'data\processed_data\BMY\4_2023-04-04.md'


2025-11-14 15:48:31,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,009 - INFO - Going to convert document batch...
2025-11-14 15:48:32,010 - INFO - Processing document 4_2023-05-03
2025-11-14 15:48:32,046 - INFO - Finished converting document 4_2023-05-03 in 0.08 sec.
2025-11-14 15:48:32,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,104 - INFO - Going to convert document batch...
2025-11-14 15:48:32,104 - INFO - Processing document 4_2023-05-04
2025-11-14 15:48:32,124 - INFO - Finished converting document 4_2023-05-04 in 0.05 sec.
2025-11-14 15:48:32,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,183 - INFO - Going to convert document batch...
2025-11-14 15:48:32,183 - INFO - Processing document 4_2023-06-06
2025-11-14 15:48:32,208 - INFO - Finished converting document 4_2023-06-06 in 0.05 sec.
2025-11-14 15:48:32,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\4_2023-05-03' --> 'data\processed_data\BMY\4_2023-05-03.md'
Converted 'data\edgar_documents\BMY\4_2023-05-04' --> 'data\processed_data\BMY\4_2023-05-04.md'
Converted 'data\edgar_documents\BMY\4_2023-06-06' --> 'data\processed_data\BMY\4_2023-06-06.md'


2025-11-14 15:48:32,277 - INFO - Going to convert document batch...
2025-11-14 15:48:32,279 - INFO - Processing document 4_2023-07-05
2025-11-14 15:48:32,305 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:48:32,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,370 - INFO - Going to convert document batch...
2025-11-14 15:48:32,371 - INFO - Processing document 4_2023-08-07
2025-11-14 15:48:32,392 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 15:48:32,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,433 - INFO - Going to convert document batch...
2025-11-14 15:48:32,434 - INFO - Processing document 4_2023-08-28
2025-11-14 15:48:32,463 - INFO - Finished converting document 4_2023-08-28 in 0.05 sec.
2025-11-14 15:48:32,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\4_2023-07-05' --> 'data\processed_data\BMY\4_2023-07-05.md'
Converted 'data\edgar_documents\BMY\4_2023-08-07' --> 'data\processed_data\BMY\4_2023-08-07.md'
Converted 'data\edgar_documents\BMY\4_2023-08-28' --> 'data\processed_data\BMY\4_2023-08-28.md'


2025-11-14 15:48:32,533 - INFO - Going to convert document batch...
2025-11-14 15:48:32,534 - INFO - Processing document 4_2023-10-03
2025-11-14 15:48:32,556 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 15:48:32,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,600 - INFO - Going to convert document batch...
2025-11-14 15:48:32,601 - INFO - Processing document 4_2023-10-04
2025-11-14 15:48:32,620 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 15:48:32,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,665 - INFO - Going to convert document batch...
2025-11-14 15:48:32,665 - INFO - Processing document 4_2023-10-12
2025-11-14 15:48:32,684 - INFO - Finished converting document 4_2023-10-12 in 0.05 sec.
2025-11-14 15:48:32,760 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BMY\4_2023-10-03' --> 'data\processed_data\BMY\4_2023-10-03.md'
Converted 'data\edgar_documents\BMY\4_2023-10-04' --> 'data\processed_data\BMY\4_2023-10-04.md'
Converted 'data\edgar_documents\BMY\4_2023-10-12' --> 'data\processed_data\BMY\4_2023-10-12.md'


2025-11-14 15:48:32,762 - ERROR - Input document 4_2023-10-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:32,763 - INFO - Going to convert document batch...
2025-11-14 15:48:32,788 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:32,789 - ERROR - Input document 4_2023-11-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BMY\4_2023-10-30: File format not allowed: data\edgar_documents\BMY\4_2023-10-30
Error processing data\edgar_documents\BMY\4_2023-11-01: File format not allowed: data\edgar_documents\BMY\4_2023-11-01
Converted 'data\edgar_documents\BMY\4_2023-11-03' --> 'data\processed_data\BMY\4_2023-11-03.md'
Converted 'data\edgar_documents\BMY\4_2023-11-21' --> 'data\processed_data\BMY\4_2023-11-21.md'


2025-11-14 15:48:32,964 - INFO - Finished converting document 4_2023-11-24 in 0.05 sec.
2025-11-14 15:48:33,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,007 - INFO - Going to convert document batch...
2025-11-14 15:48:33,008 - INFO - Processing document 4_2023-11-30
2025-11-14 15:48:33,027 - INFO - Finished converting document 4_2023-11-30 in 0.05 sec.
2025-11-14 15:48:33,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,088 - INFO - Going to convert document batch...
2025-11-14 15:48:33,089 - INFO - Processing document 4_2023-12-05
2025-11-14 15:48:33,120 - INFO - Finished converting document 4_2023-12-05 in 0.08 sec.
2025-11-14 15:48:33,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,163 - INFO - Going to convert document batch...
2025-11-14 15:48:33,164 - INFO - Processing document 4_2023-12-07


Converted 'data\edgar_documents\BMY\4_2023-11-24' --> 'data\processed_data\BMY\4_2023-11-24.md'
Converted 'data\edgar_documents\BMY\4_2023-11-30' --> 'data\processed_data\BMY\4_2023-11-30.md'
Converted 'data\edgar_documents\BMY\4_2023-12-05' --> 'data\processed_data\BMY\4_2023-12-05.md'


2025-11-14 15:48:33,181 - INFO - Finished converting document 4_2023-12-07 in 0.03 sec.
2025-11-14 15:48:33,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,224 - INFO - Going to convert document batch...
2025-11-14 15:48:33,226 - INFO - Processing document 4_2024-01-03
2025-11-14 15:48:33,249 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:48:33,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,292 - INFO - Going to convert document batch...
2025-11-14 15:48:33,292 - INFO - Processing document 4_2024-02-05
2025-11-14 15:48:33,319 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 15:48:33,366 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:33,367 - ERROR - Input document 4_2024-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\BMY\4_2023-12-07' --> 'data\processed_data\BMY\4_2023-12-07.md'
Converted 'data\edgar_documents\BMY\4_2024-01-03' --> 'data\processed_data\BMY\4_2024-01-03.md'
Converted 'data\edgar_documents\BMY\4_2024-02-05' --> 'data\processed_data\BMY\4_2024-02-05.md'
Error processing data\edgar_documents\BMY\4_2024-02-13: File format not allowed: data\edgar_documents\BMY\4_2024-02-13


2025-11-14 15:48:33,396 - ERROR - Input document 4_2024-02-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:33,399 - INFO - Going to convert document batch...
2025-11-14 15:48:33,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,431 - INFO - Going to convert document batch...
2025-11-14 15:48:33,432 - INFO - Processing document 4_2024-03-04
2025-11-14 15:48:33,454 - INFO - Finished converting document 4_2024-03-04 in 0.06 sec.
2025-11-14 15:48:33,488 - INFO - detec

Error processing data\edgar_documents\BMY\4_2024-02-16: File format not allowed: data\edgar_documents\BMY\4_2024-02-16
Converted 'data\edgar_documents\BMY\4_2024-03-04' --> 'data\processed_data\BMY\4_2024-03-04.md'


2025-11-14 15:48:33,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,670 - INFO - Going to convert document batch...
2025-11-14 15:48:33,671 - INFO - Processing document 4_2024-04-02
2025-11-14 15:48:33,698 - INFO - Finished converting document 4_2024-04-02 in 0.06 sec.
2025-11-14 15:48:33,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,772 - INFO - Going to convert document batch...
2025-11-14 15:48:33,773 - INFO - Processing document 4_2024-05-03
2025-11-14 15:48:33,801 - INFO - Finished converting document 4_2024-05-03 in 0.08 sec.


Converted 'data\edgar_documents\BMY\4_2024-03-12' --> 'data\processed_data\BMY\4_2024-03-12.md'
Converted 'data\edgar_documents\BMY\4_2024-04-02' --> 'data\processed_data\BMY\4_2024-04-02.md'


2025-11-14 15:48:33,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,865 - INFO - Going to convert document batch...
2025-11-14 15:48:33,866 - INFO - Processing document 4_2024-07-02
2025-11-14 15:48:33,916 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.
2025-11-14 15:48:33,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,981 - INFO - Going to convert document batch...
2025-11-14 15:48:33,981 - INFO - Processing document 4_2024-07-31
2025-11-14 15:48:34,009 - INFO - Finished converting document 4_2024-07-31 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2024-05-03' --> 'data\processed_data\BMY\4_2024-05-03.md'
Converted 'data\edgar_documents\BMY\4_2024-07-02' --> 'data\processed_data\BMY\4_2024-07-02.md'


2025-11-14 15:48:34,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,070 - INFO - Going to convert document batch...
2025-11-14 15:48:34,071 - INFO - Processing document 4_2024-08-05
2025-11-14 15:48:34,095 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 15:48:34,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,154 - INFO - Going to convert document batch...
2025-11-14 15:48:34,155 - INFO - Processing document 4_2024-10-02
2025-11-14 15:48:34,174 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 15:48:34,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,234 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\4_2024-07-31' --> 'data\processed_data\BMY\4_2024-07-31.md'
Converted 'data\edgar_documents\BMY\4_2024-08-05' --> 'data\processed_data\BMY\4_2024-08-05.md'
Converted 'data\edgar_documents\BMY\4_2024-10-02' --> 'data\processed_data\BMY\4_2024-10-02.md'


2025-11-14 15:48:34,236 - INFO - Processing document 4_2024-10-03
2025-11-14 15:48:34,258 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 15:48:34,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,301 - INFO - Going to convert document batch...
2025-11-14 15:48:34,301 - INFO - Processing document 4_2024-11-05
2025-11-14 15:48:34,318 - INFO - Finished converting document 4_2024-11-05 in 0.03 sec.
2025-11-14 15:48:34,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,380 - INFO - Going to convert document batch...
2025-11-14 15:48:34,381 - INFO - Processing document 4_2025-01-02
2025-11-14 15:48:34,401 - INFO - Finished converting document 4_2025-01-02 in 0.06 sec.
2025-11-14 15:48:34,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,467 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\4_2024-10-03' --> 'data\processed_data\BMY\4_2024-10-03.md'
Converted 'data\edgar_documents\BMY\4_2024-11-05' --> 'data\processed_data\BMY\4_2024-11-05.md'
Converted 'data\edgar_documents\BMY\4_2025-01-02' --> 'data\processed_data\BMY\4_2025-01-02.md'


2025-11-14 15:48:34,468 - INFO - Processing document 4_2025-02-04
2025-11-14 15:48:34,514 - INFO - Finished converting document 4_2025-02-04 in 0.09 sec.
2025-11-14 15:48:34,556 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,570 - INFO - Going to convert document batch...
2025-11-14 15:48:34,571 - INFO - Processing document 4_2025-02-19
2025-11-14 15:48:34,591 - INFO - Finished converting document 4_2025-02-19 in 0.05 sec.
2025-11-14 15:48:34,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,632 - INFO - Going to convert document batch...
2025-11-14 15:48:34,633 - INFO - Processing document 4_2025-02-21
2025-11-14 15:48:34,652 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 15:48:34,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,694 - INFO - Going to convert document batch...
2025-11-14 15:48:34,695 - INFO - Processing document 4_2025-03-04
2025-11-14 15:48:34,717 - IN

Converted 'data\edgar_documents\BMY\4_2025-02-04' --> 'data\processed_data\BMY\4_2025-02-04.md'
Converted 'data\edgar_documents\BMY\4_2025-02-19' --> 'data\processed_data\BMY\4_2025-02-19.md'
Converted 'data\edgar_documents\BMY\4_2025-02-21' --> 'data\processed_data\BMY\4_2025-02-21.md'
Converted 'data\edgar_documents\BMY\4_2025-03-04' --> 'data\processed_data\BMY\4_2025-03-04.md'


2025-11-14 15:48:34,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,775 - INFO - Going to convert document batch...
2025-11-14 15:48:34,777 - INFO - Processing document 4_2025-03-12
2025-11-14 15:48:34,824 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.
2025-11-14 15:48:34,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,885 - INFO - Going to convert document batch...
2025-11-14 15:48:34,886 - INFO - Processing document 4_2025-04-01
2025-11-14 15:48:34,906 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 15:48:34,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,952 - INFO - Going to convert document batch...
2025-11-14 15:48:34,953 - INFO - Processing document 4_2025-04-03
2025-11-14 15:48:34,979 - INFO - Finished converting document 4_2025-04-03 in 0.06 sec.
2025-11-14 15:48:35,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BMY\4_2025-03-12' --> 'data\processed_data\BMY\4_2025-03-12.md'
Converted 'data\edgar_documents\BMY\4_2025-04-01' --> 'data\processed_data\BMY\4_2025-04-01.md'
Converted 'data\edgar_documents\BMY\4_2025-04-03' --> 'data\processed_data\BMY\4_2025-04-03.md'


2025-11-14 15:48:35,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,106 - INFO - Going to convert document batch...
2025-11-14 15:48:35,109 - INFO - Processing document 4_2025-05-05
2025-11-14 15:48:35,166 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.
2025-11-14 15:48:35,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,215 - INFO - Going to convert document batch...
2025-11-14 15:48:35,217 - INFO - Processing document 4_2025-05-13
2025-11-14 15:48:35,242 - INFO - Finished converting document 4_2025-05-13 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2025-04-29' --> 'data\processed_data\BMY\4_2025-04-29.md'
Converted 'data\edgar_documents\BMY\4_2025-05-05' --> 'data\processed_data\BMY\4_2025-05-05.md'


2025-11-14 15:48:35,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,299 - INFO - Going to convert document batch...
2025-11-14 15:48:35,299 - INFO - Processing document 4_2025-06-04
2025-11-14 15:48:35,323 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 15:48:35,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,392 - INFO - Going to convert document batch...
2025-11-14 15:48:35,392 - INFO - Processing document 4_2025-06-16
2025-11-14 15:48:35,413 - INFO - Finished converting document 4_2025-06-16 in 0.06 sec.


Converted 'data\edgar_documents\BMY\4_2025-05-13' --> 'data\processed_data\BMY\4_2025-05-13.md'
Converted 'data\edgar_documents\BMY\4_2025-06-04' --> 'data\processed_data\BMY\4_2025-06-04.md'
Converted 'data\edgar_documents\BMY\4_2025-06-16' --> 'data\processed_data\BMY\4_2025-06-16.md'


2025-11-14 15:48:35,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,456 - INFO - Going to convert document batch...
2025-11-14 15:48:35,457 - INFO - Processing document 4_2025-07-01
2025-11-14 15:48:35,477 - INFO - Finished converting document 4_2025-07-01 in 0.03 sec.
2025-11-14 15:48:35,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,522 - INFO - Going to convert document batch...
2025-11-14 15:48:35,524 - INFO - Processing document 4_2025-07-02
2025-11-14 15:48:35,543 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 15:48:35,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,601 - INFO - Going to convert document batch...
2025-11-14 15:48:35,602 - INFO - Processing document 4_2025-08-05
2025-11-14 15:48:35,622 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 15:48:35,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BMY\4_2025-07-01' --> 'data\processed_data\BMY\4_2025-07-01.md'
Converted 'data\edgar_documents\BMY\4_2025-07-02' --> 'data\processed_data\BMY\4_2025-07-02.md'
Converted 'data\edgar_documents\BMY\4_2025-08-05' --> 'data\processed_data\BMY\4_2025-08-05.md'


2025-11-14 15:48:35,684 - INFO - Processing document 4_2025-09-03
2025-11-14 15:48:35,705 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.
2025-11-14 15:48:35,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,746 - INFO - Going to convert document batch...
2025-11-14 15:48:35,747 - INFO - Processing document 4_2025-10-02
2025-11-14 15:48:35,766 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:48:35,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,829 - INFO - Going to convert document batch...
2025-11-14 15:48:35,830 - INFO - Processing document 4_2025-10-06
2025-11-14 15:48:35,849 - INFO - Finished converting document 4_2025-10-06 in 0.06 sec.
2025-11-14 15:48:35,894 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:35,895 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\BMY\4_2025-09-03' --> 'data\processed_data\BMY\4_2025-09-03.md'
Converted 'data\edgar_documents\BMY\4_2025-10-02' --> 'data\processed_data\BMY\4_2025-10-02.md'
Converted 'data\edgar_documents\BMY\4_2025-10-06' --> 'data\processed_data\BMY\4_2025-10-06.md'
Error processing data\edgar_documents\BMY\4_2025-11-03: File format not allowed: data\edgar_documents\BMY\4_2025-11-03


2025-11-14 15:48:35,918 - INFO - Going to convert document batch...
2025-11-14 15:48:35,919 - INFO - Processing document 4_2025-11-04
2025-11-14 15:48:35,943 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 15:48:35,991 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:35,992 - ERROR - Input document 4_2025-11-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:35,995 - INFO - Going to convert document batch...
2025-11-14 15:48:36,009 - IN

Converted 'data\edgar_documents\BMY\4_2025-11-04' --> 'data\processed_data\BMY\4_2025-11-04.md'
Error processing data\edgar_documents\BMY\4_2025-11-07: File format not allowed: data\edgar_documents\BMY\4_2025-11-07
Converted 'data\edgar_documents\BMY\8-K_2023-01-09' --> 'data\processed_data\BMY\8-K_2023-01-09.md'
Converted 'data\edgar_documents\BMY\8-K_2023-01-31' --> 'data\processed_data\BMY\8-K_2023-01-31.md'


2025-11-14 15:48:36,163 - INFO - Going to convert document batch...
2025-11-14 15:48:36,165 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:48:36,198 - INFO - Finished converting document 8-K_2023-02-02 in 0.08 sec.
2025-11-14 15:48:36,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,248 - INFO - Going to convert document batch...
2025-11-14 15:48:36,249 - INFO - Processing document 8-K_2023-02-28
2025-11-14 15:48:36,267 - INFO - Finished converting document 8-K_2023-02-28 in 0.05 sec.
2025-11-14 15:48:36,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,307 - INFO - Going to convert document batch...
2025-11-14 15:48:36,309 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:48:36,341 - INFO - Finished converting document 8-K_2023-04-26 in 0.06 sec.
2025-11-14 15:48:36,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,406 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\8-K_2023-02-02' --> 'data\processed_data\BMY\8-K_2023-02-02.md'
Converted 'data\edgar_documents\BMY\8-K_2023-02-28' --> 'data\processed_data\BMY\8-K_2023-02-28.md'
Converted 'data\edgar_documents\BMY\8-K_2023-04-26' --> 'data\processed_data\BMY\8-K_2023-04-26.md'


2025-11-14 15:48:36,407 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:48:36,449 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 15:48:36,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,532 - INFO - Going to convert document batch...
2025-11-14 15:48:36,534 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:48:36,571 - INFO - Finished converting document 8-K_2023-05-04 in 0.09 sec.
2025-11-14 15:48:36,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,617 - INFO - Going to convert document batch...
2025-11-14 15:48:36,618 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:48:36,639 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-04-27' --> 'data\processed_data\BMY\8-K_2023-04-27.md'
Converted 'data\edgar_documents\BMY\8-K_2023-05-04' --> 'data\processed_data\BMY\8-K_2023-05-04.md'


2025-11-14 15:48:36,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,687 - INFO - Going to convert document batch...
2025-11-14 15:48:36,688 - INFO - Processing document 8-K_2023-08-10
2025-11-14 15:48:36,717 - INFO - Finished converting document 8-K_2023-08-10 in 0.06 sec.
2025-11-14 15:48:36,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,763 - INFO - Going to convert document batch...
2025-11-14 15:48:36,764 - INFO - Processing document 8-K_2023-10-26


Converted 'data\edgar_documents\BMY\8-K_2023-07-27' --> 'data\processed_data\BMY\8-K_2023-07-27.md'
Converted 'data\edgar_documents\BMY\8-K_2023-08-10' --> 'data\processed_data\BMY\8-K_2023-08-10.md'


2025-11-14 15:48:37,289 - INFO - Finished converting document 8-K_2023-10-26 in 0.55 sec.
2025-11-14 15:48:37,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,351 - INFO - Going to convert document batch...
2025-11-14 15:48:37,352 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:48:37,375 - INFO - Finished converting document 8-K_2023-10-31 in 0.06 sec.
2025-11-14 15:48:37,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,454 - INFO - Going to convert document batch...
2025-11-14 15:48:37,456 - INFO - Processing document 8-K_2023-11-13
2025-11-14 15:48:37,497 - INFO - Finished converting document 8-K_2023-11-13 in 0.11 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-10-26' --> 'data\processed_data\BMY\8-K_2023-10-26.md'
Converted 'data\edgar_documents\BMY\8-K_2023-10-31' --> 'data\processed_data\BMY\8-K_2023-10-31.md'


2025-11-14 15:48:37,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,569 - INFO - Going to convert document batch...
2025-11-14 15:48:37,571 - INFO - Processing document 8-K_2023-12-22
2025-11-14 15:48:37,603 - INFO - Finished converting document 8-K_2023-12-22 in 0.08 sec.
2025-11-14 15:48:37,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,651 - INFO - Going to convert document batch...
2025-11-14 15:48:37,652 - INFO - Processing document 8-K_2024-01-08
2025-11-14 15:48:37,681 - INFO - Finished converting document 8-K_2024-01-08 in 0.06 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-11-13' --> 'data\processed_data\BMY\8-K_2023-11-13.md'
Converted 'data\edgar_documents\BMY\8-K_2023-12-22' --> 'data\processed_data\BMY\8-K_2023-12-22.md'
Converted 'data\edgar_documents\BMY\8-K_2024-01-08' --> 'data\processed_data\BMY\8-K_2024-01-08.md'


2025-11-14 15:48:37,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,732 - INFO - Going to convert document batch...
2025-11-14 15:48:37,733 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:48:37,758 - INFO - Finished converting document 8-K_2024-02-02 in 0.06 sec.
2025-11-14 15:48:37,789 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:37,790 - ERROR - Input document 8-K_2024-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\BMY\8-K_2024-02-02' --> 'data\processed_data\BMY\8-K_2024-02-02.md'
Error processing data\edgar_documents\BMY\8-K_2024-02-14: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-14
Error processing data\edgar_documents\BMY\8-K_2024-02-15: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-15
Error processing data\edgar_documents\BMY\8-K_2024-02-22: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-22
Error processing data\edgar_documents\BMY\8-K_2024-03-18: File format not allowed: data\edgar_documents\BMY\8-K_2024-03-18
Converted 'data\edgar_documents\BMY\8-K_2024-04-25' --> 'data\processed_data\BMY\8-K_2024-04-25.md'


2025-11-14 15:48:37,953 - ERROR - Input document 8-K_2024-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:37,954 - INFO - Going to convert document batch...
2025-11-14 15:48:37,970 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:37,971 - ERROR - Input document 8-K_2024-06-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, 

Error processing data\edgar_documents\BMY\8-K_2024-05-09: File format not allowed: data\edgar_documents\BMY\8-K_2024-05-09
Error processing data\edgar_documents\BMY\8-K_2024-06-18: File format not allowed: data\edgar_documents\BMY\8-K_2024-06-18
Converted 'data\edgar_documents\BMY\8-K_2024-07-26' --> 'data\processed_data\BMY\8-K_2024-07-26.md'
Converted 'data\edgar_documents\BMY\8-K_2024-10-31' --> 'data\processed_data\BMY\8-K_2024-10-31.md'
Error processing data\edgar_documents\BMY\8-K_2025-01-13: File format not allowed: data\edgar_documents\BMY\8-K_2025-01-13


2025-11-14 15:48:38,161 - INFO - Going to convert document batch...
2025-11-14 15:48:38,162 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:48:38,189 - INFO - Finished converting document 8-K_2025-02-06 in 0.06 sec.
2025-11-14 15:48:38,224 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:38,225 - ERROR - Input document 8-K_2025-02-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:38,227 - INFO - Going to convert docu

Converted 'data\edgar_documents\BMY\8-K_2025-02-06' --> 'data\processed_data\BMY\8-K_2025-02-06.md'
Error processing data\edgar_documents\BMY\8-K_2025-02-18: File format not allowed: data\edgar_documents\BMY\8-K_2025-02-18
Converted 'data\edgar_documents\BMY\8-K_2025-04-24' --> 'data\processed_data\BMY\8-K_2025-04-24.md'
Error processing data\edgar_documents\BMY\8-K_2025-05-07: File format not allowed: data\edgar_documents\BMY\8-K_2025-05-07
Error processing data\edgar_documents\BMY\8-K_2025-07-25: File format not allowed: data\edgar_documents\BMY\8-K_2025-07-25


2025-11-14 15:48:38,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:38,433 - INFO - Going to convert document batch...
2025-11-14 15:48:38,434 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:48:38,453 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 15:48:38,502 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:38,503 - ERROR - Input document 8-K_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\BMY\8-K_2025-07-31' --> 'data\processed_data\BMY\8-K_2025-07-31.md'
Converted 'data\edgar_documents\BMY\8-K_2025-10-30' --> 'data\processed_data\BMY\8-K_2025-10-30.md'
Error processing data\edgar_documents\BMY\8-K_2025-11-03: File format not allowed: data\edgar_documents\BMY\8-K_2025-11-03
Error processing data\edgar_documents\BMY\8-K_2025-11-10: File format not allowed: data\edgar_documents\BMY\8-K_2025-11-10


2025-11-14 15:48:39,337 - INFO - Going to convert document batch...
2025-11-14 15:48:39,338 - INFO - Processing document DEF-14A_2023-03-23
2025-11-14 15:48:44,016 - INFO - Finished converting document DEF-14A_2023-03-23 in 5.48 sec.
2025-11-14 15:48:44,742 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:44,743 - ERROR - Input document DEF-14A_2024-03-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:44,746 - INFO - Going to 

Converted 'data\edgar_documents\BMY\DEF-14A_2023-03-23' --> 'data\processed_data\BMY\DEF-14A_2023-03-23.md'
Error processing data\edgar_documents\BMY\DEF-14A_2024-03-28: File format not allowed: data\edgar_documents\BMY\DEF-14A_2024-03-28


2025-11-14 15:48:45,510 - INFO - Going to convert document batch...
2025-11-14 15:48:45,511 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 15:48:47,130 - INFO - Finished converting document DEF-14A_2025-03-26 in 2.38 sec.


Converted 'data\edgar_documents\BMY\DEF-14A_2025-03-26' --> 'data\processed_data\BMY\DEF-14A_2025-03-26.md'
Processed 88 new files. Errors: 19
Found 157 files to process in data\edgar_documents\BRK-B


2025-11-14 15:48:48,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:51,071 - INFO - Going to convert document batch...
2025-11-14 15:48:51,072 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:48:51,072 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:48:56,348 - INFO - Finished converting document 10-K_2023-02-27 in 8.42 sec.
2025-11-14 15:48:57,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-K_2023-02-27' --> 'data\processed_data\BRK-B\10-K_2023-02-27.md'


2025-11-14 15:49:00,635 - INFO - Going to convert document batch...
2025-11-14 15:49:00,636 - INFO - Processing document 10-K_2024-02-26
2025-11-14 15:49:07,623 - INFO - Finished converting document 10-K_2024-02-26 in 10.61 sec.


Converted 'data\edgar_documents\BRK-B\10-K_2024-02-26' --> 'data\processed_data\BRK-B\10-K_2024-02-26.md'


2025-11-14 15:49:09,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:49:17,866 - INFO - Going to convert document batch...
2025-11-14 15:49:17,867 - INFO - Processing document 10-K_2025-02-24
2025-11-14 15:49:31,422 - INFO - Finished converting document 10-K_2025-02-24 in 22.55 sec.
2025-11-14 15:49:33,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-K_2025-02-24' --> 'data\processed_data\BRK-B\10-K_2025-02-24.md'


2025-11-14 15:49:35,225 - INFO - Going to convert document batch...
2025-11-14 15:49:35,226 - INFO - Processing document 10-Q_2023-05-08
2025-11-14 15:49:37,897 - INFO - Finished converting document 10-Q_2023-05-08 in 4.83 sec.
2025-11-14 15:49:38,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-05-08' --> 'data\processed_data\BRK-B\10-Q_2023-05-08.md'


2025-11-14 15:49:40,006 - INFO - Going to convert document batch...
2025-11-14 15:49:40,007 - INFO - Processing document 10-Q_2023-08-07
2025-11-14 15:49:44,675 - INFO - Finished converting document 10-Q_2023-08-07 in 6.44 sec.
2025-11-14 15:49:45,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-08-07' --> 'data\processed_data\BRK-B\10-Q_2023-08-07.md'


2025-11-14 15:49:49,138 - INFO - Going to convert document batch...
2025-11-14 15:49:49,139 - INFO - Processing document 10-Q_2023-11-06
2025-11-14 15:49:51,898 - INFO - Finished converting document 10-Q_2023-11-06 in 6.28 sec.
2025-11-14 15:49:52,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-11-06' --> 'data\processed_data\BRK-B\10-Q_2023-11-06.md'


2025-11-14 15:49:53,603 - INFO - Going to convert document batch...
2025-11-14 15:49:53,604 - INFO - Processing document 10-Q_2024-05-06
2025-11-14 15:49:55,863 - INFO - Finished converting document 10-Q_2024-05-06 in 3.50 sec.
2025-11-14 15:49:56,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-05-06' --> 'data\processed_data\BRK-B\10-Q_2024-05-06.md'


2025-11-14 15:49:57,552 - INFO - Going to convert document batch...
2025-11-14 15:49:57,553 - INFO - Processing document 10-Q_2024-08-05
2025-11-14 15:50:00,260 - INFO - Finished converting document 10-Q_2024-08-05 in 4.09 sec.
2025-11-14 15:50:00,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-08-05' --> 'data\processed_data\BRK-B\10-Q_2024-08-05.md'


2025-11-14 15:50:03,475 - INFO - Going to convert document batch...
2025-11-14 15:50:03,476 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 15:50:07,838 - INFO - Finished converting document 10-Q_2024-11-04 in 7.20 sec.
2025-11-14 15:50:08,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-11-04' --> 'data\processed_data\BRK-B\10-Q_2024-11-04.md'


2025-11-14 15:50:12,523 - INFO - Going to convert document batch...
2025-11-14 15:50:12,524 - INFO - Processing document 10-Q_2025-05-05
2025-11-14 15:50:15,999 - INFO - Finished converting document 10-Q_2025-05-05 in 7.45 sec.
2025-11-14 15:50:16,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2025-05-05' --> 'data\processed_data\BRK-B\10-Q_2025-05-05.md'


2025-11-14 15:50:21,553 - INFO - Going to convert document batch...
2025-11-14 15:50:21,554 - INFO - Processing document 10-Q_2025-08-04
2025-11-14 15:50:26,216 - INFO - Finished converting document 10-Q_2025-08-04 in 9.42 sec.
2025-11-14 15:50:27,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2025-08-04' --> 'data\processed_data\BRK-B\10-Q_2025-08-04.md'


2025-11-14 15:50:31,791 - INFO - Going to convert document batch...
2025-11-14 15:50:31,793 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 15:50:36,374 - INFO - Finished converting document 10-Q_2025-11-03 in 9.27 sec.
2025-11-14 15:50:37,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:37,396 - INFO - Going to convert document batch...
2025-11-14 15:50:37,398 - INFO - Processing document 4_2023-02-24
2025-11-14 15:50:37,466 - INFO - Finished converting document 4_2023-02-24 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\10-Q_2025-11-03' --> 'data\processed_data\BRK-B\10-Q_2025-11-03.md'


2025-11-14 15:50:37,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:37,569 - INFO - Going to convert document batch...
2025-11-14 15:50:37,571 - INFO - Processing document 4_2023-03-03
2025-11-14 15:50:37,634 - INFO - Finished converting document 4_2023-03-03 in 0.09 sec.
2025-11-14 15:50:37,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-02-24' --> 'data\processed_data\BRK-B\4_2023-02-24.md'
Converted 'data\edgar_documents\BRK-B\4_2023-03-03' --> 'data\processed_data\BRK-B\4_2023-03-03.md'


2025-11-14 15:50:37,762 - INFO - Going to convert document batch...
2025-11-14 15:50:37,765 - INFO - Processing document 4_2023-03-07
2025-11-14 15:50:37,875 - INFO - Finished converting document 4_2023-03-07 in 0.19 sec.
2025-11-14 15:50:37,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,023 - INFO - Going to convert document batch...
2025-11-14 15:50:38,024 - INFO - Processing document 4_2023-03-15
2025-11-14 15:50:38,158 - INFO - Finished converting document 4_2023-03-15 in 0.20 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-03-07' --> 'data\processed_data\BRK-B\4_2023-03-07.md'


2025-11-14 15:50:38,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,281 - INFO - Going to convert document batch...
2025-11-14 15:50:38,282 - INFO - Processing document 4_2023-03-21
2025-11-14 15:50:38,338 - INFO - Finished converting document 4_2023-03-21 in 0.09 sec.
2025-11-14 15:50:38,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-03-15' --> 'data\processed_data\BRK-B\4_2023-03-15.md'
Converted 'data\edgar_documents\BRK-B\4_2023-03-21' --> 'data\processed_data\BRK-B\4_2023-03-21.md'


2025-11-14 15:50:38,463 - INFO - Going to convert document batch...
2025-11-14 15:50:38,466 - INFO - Processing document 4_2023-03-27
2025-11-14 15:50:38,559 - INFO - Finished converting document 4_2023-03-27 in 0.16 sec.
2025-11-14 15:50:38,654 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:38,655 - ERROR - Input document 4_2023-04-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:38,657 - INFO - Going to convert document batch...
2025-11-14 15:50:38,676 - IN

Converted 'data\edgar_documents\BRK-B\4_2023-03-27' --> 'data\processed_data\BRK-B\4_2023-03-27.md'
Error processing data\edgar_documents\BRK-B\4_2023-04-05: File format not allowed: data\edgar_documents\BRK-B\4_2023-04-05
Error processing data\edgar_documents\BRK-B\4_2023-04-17: File format not allowed: data\edgar_documents\BRK-B\4_2023-04-17


2025-11-14 15:50:38,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,942 - INFO - Going to convert document batch...
2025-11-14 15:50:38,944 - INFO - Processing document 4_2023-05-15


Converted 'data\edgar_documents\BRK-B\4_2023-05-12' --> 'data\processed_data\BRK-B\4_2023-05-12.md'


2025-11-14 15:50:39,080 - INFO - Finished converting document 4_2023-05-15 in 0.22 sec.
2025-11-14 15:50:39,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,238 - INFO - Going to convert document batch...
2025-11-14 15:50:39,239 - INFO - Processing document 4_2023-05-18
2025-11-14 15:50:39,317 - INFO - Finished converting document 4_2023-05-18 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-05-15' --> 'data\processed_data\BRK-B\4_2023-05-15.md'
Converted 'data\edgar_documents\BRK-B\4_2023-05-18' --> 'data\processed_data\BRK-B\4_2023-05-18.md'


2025-11-14 15:50:39,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,448 - INFO - Going to convert document batch...
2025-11-14 15:50:39,449 - INFO - Processing document 4_2023-05-30
2025-11-14 15:50:39,528 - INFO - Finished converting document 4_2023-05-30 in 0.14 sec.
2025-11-14 15:50:39,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,642 - INFO - Going to convert document batch...
2025-11-14 15:50:39,643 - INFO - Processing document 4_2023-06-09
2025-11-14 15:50:39,703 - INFO - Finished converting document 4_2023-06-09 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-05-30' --> 'data\processed_data\BRK-B\4_2023-05-30.md'


2025-11-14 15:50:39,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,823 - INFO - Going to convert document batch...
2025-11-14 15:50:39,824 - INFO - Processing document 4_2023-06-22
2025-11-14 15:50:39,885 - INFO - Finished converting document 4_2023-06-22 in 0.11 sec.
2025-11-14 15:50:39,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-06-09' --> 'data\processed_data\BRK-B\4_2023-06-09.md'
Converted 'data\edgar_documents\BRK-B\4_2023-06-22' --> 'data\processed_data\BRK-B\4_2023-06-22.md'


2025-11-14 15:50:40,028 - INFO - Going to convert document batch...
2025-11-14 15:50:40,029 - INFO - Processing document 4_2023-06-28
2025-11-14 15:50:40,106 - INFO - Finished converting document 4_2023-06-28 in 0.16 sec.
2025-11-14 15:50:40,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,220 - INFO - Going to convert document batch...
2025-11-14 15:50:40,221 - INFO - Processing document 4_2023-06-30
2025-11-14 15:50:40,273 - INFO - Finished converting document 4_2023-06-30 in 0.08 sec.
2025-11-14 15:50:40,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,376 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2023-06-28' --> 'data\processed_data\BRK-B\4_2023-06-28.md'
Converted 'data\edgar_documents\BRK-B\4_2023-06-30' --> 'data\processed_data\BRK-B\4_2023-06-30.md'


2025-11-14 15:50:40,377 - INFO - Processing document 4_2023-08-10
2025-11-14 15:50:40,424 - INFO - Finished converting document 4_2023-08-10 in 0.09 sec.
2025-11-14 15:50:40,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,526 - INFO - Going to convert document batch...
2025-11-14 15:50:40,527 - INFO - Processing document 4_2023-08-15
2025-11-14 15:50:40,569 - INFO - Finished converting document 4_2023-08-15 in 0.09 sec.
2025-11-14 15:50:40,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-08-10' --> 'data\processed_data\BRK-B\4_2023-08-10.md'
Converted 'data\edgar_documents\BRK-B\4_2023-08-15' --> 'data\processed_data\BRK-B\4_2023-08-15.md'


2025-11-14 15:50:40,658 - INFO - Going to convert document batch...
2025-11-14 15:50:40,660 - INFO - Processing document 4_2023-08-16
2025-11-14 15:50:40,712 - INFO - Finished converting document 4_2023-08-16 in 0.09 sec.
2025-11-14 15:50:40,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,793 - INFO - Going to convert document batch...
2025-11-14 15:50:40,794 - INFO - Processing document 4_2023-08-17
2025-11-14 15:50:40,848 - INFO - Finished converting document 4_2023-08-17 in 0.09 sec.
2025-11-14 15:50:40,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,931 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2023-08-16' --> 'data\processed_data\BRK-B\4_2023-08-16.md'
Converted 'data\edgar_documents\BRK-B\4_2023-08-17' --> 'data\processed_data\BRK-B\4_2023-08-17.md'


2025-11-14 15:50:40,932 - INFO - Processing document 4_2023-09-08
2025-11-14 15:50:41,002 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:50:41,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,111 - INFO - Going to convert document batch...
2025-11-14 15:50:41,112 - INFO - Processing document 4_2023-09-13
2025-11-14 15:50:41,180 - INFO - Finished converting document 4_2023-09-13 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-09-08' --> 'data\processed_data\BRK-B\4_2023-09-08.md'
Converted 'data\edgar_documents\BRK-B\4_2023-09-13' --> 'data\processed_data\BRK-B\4_2023-09-13.md'


2025-11-14 15:50:41,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,314 - INFO - Going to convert document batch...
2025-11-14 15:50:41,315 - INFO - Processing document 4_2023-09-22
2025-11-14 15:50:41,393 - INFO - Finished converting document 4_2023-09-22 in 0.14 sec.
2025-11-14 15:50:41,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,494 - INFO - Going to convert document batch...
2025-11-14 15:50:41,495 - INFO - Processing document 4_2023-09-27
2025-11-14 15:50:41,561 - INFO - Finished converting document 4_2023-09-27 in 0.11 sec.
2025-11-14 15:50:41,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-09-22' --> 'data\processed_data\BRK-B\4_2023-09-22.md'
Converted 'data\edgar_documents\BRK-B\4_2023-09-27' --> 'data\processed_data\BRK-B\4_2023-09-27.md'


2025-11-14 15:50:41,657 - INFO - Going to convert document batch...
2025-11-14 15:50:41,658 - INFO - Processing document 4_2023-10-02
2025-11-14 15:50:41,727 - INFO - Finished converting document 4_2023-10-02 in 0.11 sec.
2025-11-14 15:50:41,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,832 - INFO - Going to convert document batch...
2025-11-14 15:50:41,833 - INFO - Processing document 4_2023-10-05
2025-11-14 15:50:41,890 - INFO - Finished converting document 4_2023-10-05 in 0.11 sec.
2025-11-14 15:50:41,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-10-02' --> 'data\processed_data\BRK-B\4_2023-10-02.md'
Converted 'data\edgar_documents\BRK-B\4_2023-10-05' --> 'data\processed_data\BRK-B\4_2023-10-05.md'


2025-11-14 15:50:41,982 - INFO - Going to convert document batch...
2025-11-14 15:50:41,983 - INFO - Processing document 4_2023-10-25
2025-11-14 15:50:42,047 - INFO - Finished converting document 4_2023-10-25 in 0.11 sec.
2025-11-14 15:50:42,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,168 - INFO - Going to convert document batch...
2025-11-14 15:50:42,171 - INFO - Processing document 4_2023-10-30
2025-11-14 15:50:42,267 - INFO - Finished converting document 4_2023-10-30 in 0.16 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-10-25' --> 'data\processed_data\BRK-B\4_2023-10-25.md'


2025-11-14 15:50:42,359 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:42,360 - ERROR - Input document 4_2023-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:42,362 - INFO - Going to convert document batch...
2025-11-14 15:50:42,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,400 - INFO - Going to convert document batch...
2025-11-14 15:50:42,402 - INFO - Processing document 4_2023-11-13
2025-11-14 15:50:42,452 - INFO - Fin

Converted 'data\edgar_documents\BRK-B\4_2023-10-30' --> 'data\processed_data\BRK-B\4_2023-10-30.md'
Error processing data\edgar_documents\BRK-B\4_2023-11-08: File format not allowed: data\edgar_documents\BRK-B\4_2023-11-08
Converted 'data\edgar_documents\BRK-B\4_2023-11-13' --> 'data\processed_data\BRK-B\4_2023-11-13.md'
Error processing data\edgar_documents\BRK-B\4_2023-11-20: File format not allowed: data\edgar_documents\BRK-B\4_2023-11-20


2025-11-14 15:50:42,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,562 - INFO - Going to convert document batch...
2025-11-14 15:50:42,563 - INFO - Processing document 4_2023-11-21
2025-11-14 15:50:42,627 - INFO - Finished converting document 4_2023-11-21 in 0.09 sec.
2025-11-14 15:50:42,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,716 - INFO - Going to convert document batch...
2025-11-14 15:50:42,717 - INFO - Processing document 4_2023-11-27
2025-11-14 15:50:42,776 - INFO - Finished converting document 4_2023-11-27 in 0.11 sec.
2025-11-14 15:50:42,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-11-21' --> 'data\processed_data\BRK-B\4_2023-11-21.md'
Converted 'data\edgar_documents\BRK-B\4_2023-11-27' --> 'data\processed_data\BRK-B\4_2023-11-27.md'


2025-11-14 15:50:44,201 - INFO - Going to convert document batch...
2025-11-14 15:50:44,202 - INFO - Processing document 4_2023-12-13
2025-11-14 15:50:44,285 - INFO - Finished converting document 4_2023-12-13 in 1.45 sec.
2025-11-14 15:50:44,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,386 - INFO - Going to convert document batch...
2025-11-14 15:50:44,388 - INFO - Processing document 4_2023-12-14
2025-11-14 15:50:44,454 - INFO - Finished converting document 4_2023-12-14 in 0.11 sec.
2025-11-14 15:50:44,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-12-13' --> 'data\processed_data\BRK-B\4_2023-12-13.md'
Converted 'data\edgar_documents\BRK-B\4_2023-12-14' --> 'data\processed_data\BRK-B\4_2023-12-14.md'


2025-11-14 15:50:44,556 - INFO - Going to convert document batch...
2025-11-14 15:50:44,557 - INFO - Processing document 4_2023-12-18
2025-11-14 15:50:44,612 - INFO - Finished converting document 4_2023-12-18 in 0.11 sec.
2025-11-14 15:50:44,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,704 - INFO - Going to convert document batch...
2025-11-14 15:50:44,705 - INFO - Processing document 4_2023-12-21
2025-11-14 15:50:44,789 - INFO - Finished converting document 4_2023-12-21 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-12-18' --> 'data\processed_data\BRK-B\4_2023-12-18.md'
Converted 'data\edgar_documents\BRK-B\4_2023-12-21' --> 'data\processed_data\BRK-B\4_2023-12-21.md'


2025-11-14 15:50:44,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,912 - INFO - Going to convert document batch...
2025-11-14 15:50:44,913 - INFO - Processing document 4_2024-01-04
2025-11-14 15:50:44,980 - INFO - Finished converting document 4_2024-01-04 in 0.12 sec.
2025-11-14 15:50:45,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,077 - INFO - Going to convert document batch...
2025-11-14 15:50:45,079 - INFO - Processing document 4_2024-01-12
2025-11-14 15:50:45,134 - INFO - Finished converting document 4_2024-01-12 in 0.09 sec.
2025-11-14 15:50:45,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-01-04' --> 'data\processed_data\BRK-B\4_2024-01-04.md'
Converted 'data\edgar_documents\BRK-B\4_2024-01-12' --> 'data\processed_data\BRK-B\4_2024-01-12.md'


2025-11-14 15:50:45,229 - INFO - Going to convert document batch...
2025-11-14 15:50:45,231 - INFO - Processing document 4_2024-01-17
2025-11-14 15:50:45,312 - INFO - Finished converting document 4_2024-01-17 in 0.12 sec.
2025-11-14 15:50:45,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,429 - INFO - Going to convert document batch...
2025-11-14 15:50:45,431 - INFO - Processing document 4_2024-01-18
2025-11-14 15:50:45,561 - INFO - Finished converting document 4_2024-01-18 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-01-17' --> 'data\processed_data\BRK-B\4_2024-01-17.md'


2025-11-14 15:50:45,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,690 - INFO - Going to convert document batch...
2025-11-14 15:50:45,691 - INFO - Processing document 4_2024-01-25
2025-11-14 15:50:45,767 - INFO - Finished converting document 4_2024-01-25 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-01-18' --> 'data\processed_data\BRK-B\4_2024-01-18.md'
Converted 'data\edgar_documents\BRK-B\4_2024-01-25' --> 'data\processed_data\BRK-B\4_2024-01-25.md'


2025-11-14 15:50:45,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,886 - INFO - Going to convert document batch...
2025-11-14 15:50:45,888 - INFO - Processing document 4_2024-02-01
2025-11-14 15:50:45,978 - INFO - Finished converting document 4_2024-02-01 in 0.16 sec.
2025-11-14 15:50:46,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,081 - INFO - Going to convert document batch...
2025-11-14 15:50:46,083 - INFO - Processing document 4_2024-02-05
2025-11-14 15:50:46,167 - INFO - Finished converting document 4_2024-02-05 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-02-01' --> 'data\processed_data\BRK-B\4_2024-02-01.md'


2025-11-14 15:50:46,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,280 - INFO - Going to convert document batch...
2025-11-14 15:50:46,282 - INFO - Processing document 4_2024-03-06
2025-11-14 15:50:46,344 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 15:50:46,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-02-05' --> 'data\processed_data\BRK-B\4_2024-02-05.md'
Converted 'data\edgar_documents\BRK-B\4_2024-03-06' --> 'data\processed_data\BRK-B\4_2024-03-06.md'


2025-11-14 15:50:46,438 - INFO - Going to convert document batch...
2025-11-14 15:50:46,439 - INFO - Processing document 4_2024-03-12
2025-11-14 15:50:46,503 - INFO - Finished converting document 4_2024-03-12 in 0.09 sec.
2025-11-14 15:50:46,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,593 - INFO - Going to convert document batch...
2025-11-14 15:50:46,594 - INFO - Processing document 4_2024-03-25
2025-11-14 15:50:46,687 - INFO - Finished converting document 4_2024-03-25 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-03-12' --> 'data\processed_data\BRK-B\4_2024-03-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-03-25' --> 'data\processed_data\BRK-B\4_2024-03-25.md'


2025-11-14 15:50:46,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,783 - INFO - Going to convert document batch...
2025-11-14 15:50:46,785 - INFO - Processing document 4_2024-03-28
2025-11-14 15:50:46,849 - INFO - Finished converting document 4_2024-03-28 in 0.11 sec.
2025-11-14 15:50:46,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,940 - INFO - Going to convert document batch...
2025-11-14 15:50:46,942 - INFO - Processing document 4_2024-04-08
2025-11-14 15:50:47,013 - INFO - Finished converting document 4_2024-04-08 in 0.11 sec.
2025-11-14 15:50:47,114 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BRK-B\4_2024-03-28' --> 'data\processed_data\BRK-B\4_2024-03-28.md'
Converted 'data\edgar_documents\BRK-B\4_2024-04-08' --> 'data\processed_data\BRK-B\4_2024-04-08.md'


2025-11-14 15:50:47,115 - ERROR - Input document 4_2024-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:47,117 - INFO - Going to convert document batch...
2025-11-14 15:50:47,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,159 - INFO - Going to convert document batch...
2025-11-14 15:50:47,160 - INFO - Processing document 4_2024-04-12
2025-11-14 15:50:47,220 - INFO - Finished converting document 4_2024-04-12 in 0.09 sec.
2025-11-14 15:50:47,297 - INFO - detec

Error processing data\edgar_documents\BRK-B\4_2024-04-09: File format not allowed: data\edgar_documents\BRK-B\4_2024-04-09
Converted 'data\edgar_documents\BRK-B\4_2024-04-12' --> 'data\processed_data\BRK-B\4_2024-04-12.md'
Error processing data\edgar_documents\BRK-B\4_2024-04-22: File format not allowed: data\edgar_documents\BRK-B\4_2024-04-22


2025-11-14 15:50:47,342 - INFO - Going to convert document batch...
2025-11-14 15:50:47,344 - INFO - Processing document 4_2024-04-26
2025-11-14 15:50:47,410 - INFO - Finished converting document 4_2024-04-26 in 0.11 sec.
2025-11-14 15:50:47,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,500 - INFO - Going to convert document batch...
2025-11-14 15:50:47,501 - INFO - Processing document 4_2024-05-01
2025-11-14 15:50:47,556 - INFO - Finished converting document 4_2024-05-01 in 0.09 sec.
2025-11-14 15:50:47,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,645 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-04-26' --> 'data\processed_data\BRK-B\4_2024-04-26.md'
Converted 'data\edgar_documents\BRK-B\4_2024-05-01' --> 'data\processed_data\BRK-B\4_2024-05-01.md'


2025-11-14 15:50:47,646 - INFO - Processing document 4_2024-05-17
2025-11-14 15:50:47,705 - INFO - Finished converting document 4_2024-05-17 in 0.09 sec.
2025-11-14 15:50:47,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,795 - INFO - Going to convert document batch...
2025-11-14 15:50:47,796 - INFO - Processing document 4_2024-06-07
2025-11-14 15:50:47,880 - INFO - Finished converting document 4_2024-06-07 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-05-17' --> 'data\processed_data\BRK-B\4_2024-05-17.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-07' --> 'data\processed_data\BRK-B\4_2024-06-07.md'


2025-11-14 15:50:47,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,008 - INFO - Going to convert document batch...
2025-11-14 15:50:48,009 - INFO - Processing document 4_2024-06-12
2025-11-14 15:50:48,075 - INFO - Finished converting document 4_2024-06-12 in 0.12 sec.
2025-11-14 15:50:48,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,169 - INFO - Going to convert document batch...
2025-11-14 15:50:48,171 - INFO - Processing document 4_2024-06-17
2025-11-14 15:50:48,236 - INFO - Finished converting document 4_2024-06-17 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-06-12' --> 'data\processed_data\BRK-B\4_2024-06-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-17' --> 'data\processed_data\BRK-B\4_2024-06-17.md'


2025-11-14 15:50:48,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,356 - INFO - Going to convert document batch...
2025-11-14 15:50:48,357 - INFO - Processing document 4_2024-06-20
2025-11-14 15:50:48,427 - INFO - Finished converting document 4_2024-06-20 in 0.12 sec.
2025-11-14 15:50:48,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,550 - INFO - Going to convert document batch...
2025-11-14 15:50:48,551 - INFO - Processing document 4_2024-06-28
2025-11-14 15:50:48,605 - INFO - Finished converting document 4_2024-06-28 in 0.09 sec.
2025-11-14 15:50:48,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,699 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-06-20' --> 'data\processed_data\BRK-B\4_2024-06-20.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-28' --> 'data\processed_data\BRK-B\4_2024-06-28.md'


2025-11-14 15:50:48,701 - INFO - Processing document 4_2024-07-02
2025-11-14 15:50:48,745 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.
2025-11-14 15:50:48,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,844 - INFO - Going to convert document batch...
2025-11-14 15:50:48,845 - INFO - Processing document 4_2024-07-19
2025-11-14 15:50:48,915 - INFO - Finished converting document 4_2024-07-19 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-07-02' --> 'data\processed_data\BRK-B\4_2024-07-02.md'


2025-11-14 15:50:48,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,006 - INFO - Going to convert document batch...
2025-11-14 15:50:49,007 - INFO - Processing document 4_2024-07-24
2025-11-14 15:50:49,067 - INFO - Finished converting document 4_2024-07-24 in 0.09 sec.
2025-11-14 15:50:49,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,177 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-07-19' --> 'data\processed_data\BRK-B\4_2024-07-19.md'
Converted 'data\edgar_documents\BRK-B\4_2024-07-24' --> 'data\processed_data\BRK-B\4_2024-07-24.md'


2025-11-14 15:50:49,178 - INFO - Processing document 4_2024-07-29
2025-11-14 15:50:49,255 - INFO - Finished converting document 4_2024-07-29 in 0.14 sec.
2025-11-14 15:50:49,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,365 - INFO - Going to convert document batch...
2025-11-14 15:50:49,366 - INFO - Processing document 4_2024-08-01
2025-11-14 15:50:49,447 - INFO - Finished converting document 4_2024-08-01 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-07-29' --> 'data\processed_data\BRK-B\4_2024-07-29.md'


2025-11-14 15:50:49,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,550 - INFO - Going to convert document batch...
2025-11-14 15:50:49,551 - INFO - Processing document 4_2024-08-19
2025-11-14 15:50:49,616 - INFO - Finished converting document 4_2024-08-19 in 0.09 sec.
2025-11-14 15:50:49,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-08-01' --> 'data\processed_data\BRK-B\4_2024-08-01.md'
Converted 'data\edgar_documents\BRK-B\4_2024-08-19' --> 'data\processed_data\BRK-B\4_2024-08-19.md'


2025-11-14 15:50:49,726 - INFO - Going to convert document batch...
2025-11-14 15:50:49,727 - INFO - Processing document 4_2024-08-27
2025-11-14 15:50:49,795 - INFO - Finished converting document 4_2024-08-27 in 0.12 sec.
2025-11-14 15:50:49,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-08-27' --> 'data\processed_data\BRK-B\4_2024-08-27.md'


2025-11-14 15:50:50,321 - INFO - Going to convert document batch...
2025-11-14 15:50:50,323 - INFO - Processing document 4_2024-08-30
2025-11-14 15:50:50,390 - INFO - Finished converting document 4_2024-08-30 in 0.55 sec.
2025-11-14 15:50:50,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,495 - INFO - Going to convert document batch...
2025-11-14 15:50:50,496 - INFO - Processing document 4_2024-09-05
2025-11-14 15:50:50,576 - INFO - Finished converting document 4_2024-09-05 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-08-30' --> 'data\processed_data\BRK-B\4_2024-08-30.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-05' --> 'data\processed_data\BRK-B\4_2024-09-05.md'


2025-11-14 15:50:50,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,693 - INFO - Going to convert document batch...
2025-11-14 15:50:50,694 - INFO - Processing document 4_2024-09-10
2025-11-14 15:50:50,758 - INFO - Finished converting document 4_2024-09-10 in 0.12 sec.
2025-11-14 15:50:50,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,861 - INFO - Going to convert document batch...
2025-11-14 15:50:50,862 - INFO - Processing document 4_2024-09-11
2025-11-14 15:50:50,928 - INFO - Finished converting document 4_2024-09-11 in 0.09 sec.
2025-11-14 15:50:50,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-09-10' --> 'data\processed_data\BRK-B\4_2024-09-10.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-11' --> 'data\processed_data\BRK-B\4_2024-09-11.md'


2025-11-14 15:50:51,021 - INFO - Going to convert document batch...
2025-11-14 15:50:51,022 - INFO - Processing document 4_2024-09-12
2025-11-14 15:50:51,085 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.
2025-11-14 15:50:51,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,200 - INFO - Going to convert document batch...
2025-11-14 15:50:51,201 - INFO - Processing document 4_2024-09-13
2025-11-14 15:50:51,263 - INFO - Finished converting document 4_2024-09-13 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-09-12' --> 'data\processed_data\BRK-B\4_2024-09-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-13' --> 'data\processed_data\BRK-B\4_2024-09-13.md'


2025-11-14 15:50:51,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,396 - INFO - Going to convert document batch...
2025-11-14 15:50:51,397 - INFO - Processing document 4_2024-09-19
2025-11-14 15:50:51,473 - INFO - Finished converting document 4_2024-09-19 in 0.14 sec.
2025-11-14 15:50:51,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,569 - INFO - Going to convert document batch...
2025-11-14 15:50:51,570 - INFO - Processing document 4_2024-09-24
2025-11-14 15:50:51,639 - INFO - Finished converting document 4_2024-09-24 in 0.11 sec.
2025-11-14 15:50:51,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-09-19' --> 'data\processed_data\BRK-B\4_2024-09-19.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-24' --> 'data\processed_data\BRK-B\4_2024-09-24.md'


2025-11-14 15:50:51,740 - INFO - Going to convert document batch...
2025-11-14 15:50:51,742 - INFO - Processing document 4_2024-09-27
2025-11-14 15:50:51,812 - INFO - Finished converting document 4_2024-09-27 in 0.11 sec.
2025-11-14 15:50:51,886 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:51,886 - ERROR - Input document 4_2024-10-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:51,889 - INFO - Going to convert document batch...
2025-11-14 15:50:51,901 - IN

Converted 'data\edgar_documents\BRK-B\4_2024-09-27' --> 'data\processed_data\BRK-B\4_2024-09-27.md'
Error processing data\edgar_documents\BRK-B\4_2024-10-01: File format not allowed: data\edgar_documents\BRK-B\4_2024-10-01
Converted 'data\edgar_documents\BRK-B\4_2024-10-02' --> 'data\processed_data\BRK-B\4_2024-10-02.md'


2025-11-14 15:50:52,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,113 - INFO - Going to convert document batch...
2025-11-14 15:50:52,115 - INFO - Processing document 4_2024-10-07
2025-11-14 15:50:52,188 - INFO - Finished converting document 4_2024-10-07 in 0.14 sec.
2025-11-14 15:50:52,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,289 - INFO - Going to convert document batch...
2025-11-14 15:50:52,290 - INFO - Processing document 4_2024-10-10
2025-11-14 15:50:52,371 - INFO - Finished converting document 4_2024-10-10 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-10-07' --> 'data\processed_data\BRK-B\4_2024-10-07.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-10' --> 'data\processed_data\BRK-B\4_2024-10-10.md'


2025-11-14 15:50:52,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,503 - INFO - Going to convert document batch...
2025-11-14 15:50:52,508 - INFO - Processing document 4_2024-10-11
2025-11-14 15:50:52,584 - INFO - Finished converting document 4_2024-10-11 in 0.14 sec.
2025-11-14 15:50:52,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,680 - INFO - Going to convert document batch...
2025-11-14 15:50:52,681 - INFO - Processing document 4_2024-10-17
2025-11-14 15:50:52,747 - INFO - Finished converting document 4_2024-10-17 in 0.11 sec.
2025-11-14 15:50:52,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,844 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-10-11' --> 'data\processed_data\BRK-B\4_2024-10-11.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-17' --> 'data\processed_data\BRK-B\4_2024-10-17.md'


2025-11-14 15:50:52,845 - INFO - Processing document 4_2024-10-18
2025-11-14 15:50:52,915 - INFO - Finished converting document 4_2024-10-18 in 0.11 sec.
2025-11-14 15:50:52,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,017 - INFO - Going to convert document batch...
2025-11-14 15:50:53,018 - INFO - Processing document 4_2024-10-31
2025-11-14 15:50:53,085 - INFO - Finished converting document 4_2024-10-31 in 0.11 sec.
2025-11-14 15:50:53,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-10-18' --> 'data\processed_data\BRK-B\4_2024-10-18.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-31' --> 'data\processed_data\BRK-B\4_2024-10-31.md'


2025-11-14 15:50:53,178 - INFO - Going to convert document batch...
2025-11-14 15:50:53,180 - INFO - Processing document 4_2024-11-07
2025-11-14 15:50:53,237 - INFO - Finished converting document 4_2024-11-07 in 0.09 sec.
2025-11-14 15:50:53,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,323 - INFO - Going to convert document batch...
2025-11-14 15:50:53,324 - INFO - Processing document 4_2024-11-22
2025-11-14 15:50:53,385 - INFO - Finished converting document 4_2024-11-22 in 0.11 sec.
2025-11-14 15:50:53,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-11-07' --> 'data\processed_data\BRK-B\4_2024-11-07.md'
Converted 'data\edgar_documents\BRK-B\4_2024-11-22' --> 'data\processed_data\BRK-B\4_2024-11-22.md'


2025-11-14 15:50:53,492 - INFO - Going to convert document batch...
2025-11-14 15:50:53,493 - INFO - Processing document 4_2024-11-25
2025-11-14 15:50:53,594 - INFO - Finished converting document 4_2024-11-25 in 0.16 sec.
2025-11-14 15:50:53,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,693 - INFO - Going to convert document batch...
2025-11-14 15:50:53,694 - INFO - Processing document 4_2024-12-04
2025-11-14 15:50:53,745 - INFO - Finished converting document 4_2024-12-04 in 0.09 sec.
2025-11-14 15:50:53,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,835 - INFO - Going to convert document batch...
2025-11-14 15:50:53,837 - INFO - Processing document 4_2024-12-11


Converted 'data\edgar_documents\BRK-B\4_2024-11-25' --> 'data\processed_data\BRK-B\4_2024-11-25.md'
Converted 'data\edgar_documents\BRK-B\4_2024-12-04' --> 'data\processed_data\BRK-B\4_2024-12-04.md'


2025-11-14 15:50:53,906 - INFO - Finished converting document 4_2024-12-11 in 0.11 sec.
2025-11-14 15:50:53,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,009 - INFO - Going to convert document batch...
2025-11-14 15:50:54,010 - INFO - Processing document 4_2024-12-19
2025-11-14 15:50:54,122 - INFO - Finished converting document 4_2024-12-19 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-12-11' --> 'data\processed_data\BRK-B\4_2024-12-11.md'


2025-11-14 15:50:54,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,277 - INFO - Going to convert document batch...
2025-11-14 15:50:54,278 - INFO - Processing document 4_2024-12-26
2025-11-14 15:50:54,391 - INFO - Finished converting document 4_2024-12-26 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-12-19' --> 'data\processed_data\BRK-B\4_2024-12-19.md'


2025-11-14 15:50:54,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,525 - INFO - Going to convert document batch...
2025-11-14 15:50:54,526 - INFO - Processing document 4_2024-12-27
2025-11-14 15:50:54,569 - INFO - Finished converting document 4_2024-12-27 in 0.08 sec.
2025-11-14 15:50:54,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,670 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-12-26' --> 'data\processed_data\BRK-B\4_2024-12-26.md'
Converted 'data\edgar_documents\BRK-B\4_2024-12-27' --> 'data\processed_data\BRK-B\4_2024-12-27.md'


2025-11-14 15:50:54,672 - INFO - Processing document 4_2024-12-30
2025-11-14 15:50:54,793 - INFO - Finished converting document 4_2024-12-30 in 0.19 sec.
2025-11-14 15:50:54,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,908 - INFO - Going to convert document batch...
2025-11-14 15:50:54,910 - INFO - Processing document 4_2025-01-03
2025-11-14 15:50:54,954 - INFO - Finished converting document 4_2025-01-03 in 0.08 sec.
2025-11-14 15:50:55,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,037 - INFO - Going to convert document batch...
2025-11-14 15:50:55,038 - INFO - Processing document 4_2025-01-17


Converted 'data\edgar_documents\BRK-B\4_2024-12-30' --> 'data\processed_data\BRK-B\4_2024-12-30.md'
Converted 'data\edgar_documents\BRK-B\4_2025-01-03' --> 'data\processed_data\BRK-B\4_2025-01-03.md'


2025-11-14 15:50:55,096 - INFO - Finished converting document 4_2025-01-17 in 0.09 sec.
2025-11-14 15:50:55,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,197 - INFO - Going to convert document batch...
2025-11-14 15:50:55,198 - INFO - Processing document 4_2025-02-03
2025-11-14 15:50:55,272 - INFO - Finished converting document 4_2025-02-03 in 0.11 sec.
2025-11-14 15:50:55,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-01-17' --> 'data\processed_data\BRK-B\4_2025-01-17.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-03' --> 'data\processed_data\BRK-B\4_2025-02-03.md'


2025-11-14 15:50:55,381 - INFO - Going to convert document batch...
2025-11-14 15:50:55,383 - INFO - Processing document 4_2025-02-11
2025-11-14 15:50:55,460 - INFO - Finished converting document 4_2025-02-11 in 0.11 sec.
2025-11-14 15:50:55,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,559 - INFO - Going to convert document batch...
2025-11-14 15:50:55,561 - INFO - Processing document 4_2025-02-13
2025-11-14 15:50:55,617 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 15:50:55,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-02-11' --> 'data\processed_data\BRK-B\4_2025-02-11.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-13' --> 'data\processed_data\BRK-B\4_2025-02-13.md'


2025-11-14 15:50:55,772 - INFO - Going to convert document batch...
2025-11-14 15:50:55,773 - INFO - Processing document 4_2025-02-19
2025-11-14 15:50:55,955 - INFO - Finished converting document 4_2025-02-19 in 0.27 sec.
2025-11-14 15:50:56,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,133 - INFO - Going to convert document batch...
2025-11-14 15:50:56,134 - INFO - Processing document 4_2025-02-25
2025-11-14 15:50:56,200 - INFO - Finished converting document 4_2025-02-25 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-02-19' --> 'data\processed_data\BRK-B\4_2025-02-19.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-25' --> 'data\processed_data\BRK-B\4_2025-02-25.md'


2025-11-14 15:50:56,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,319 - INFO - Going to convert document batch...
2025-11-14 15:50:56,320 - INFO - Processing document 4_2025-03-04
2025-11-14 15:50:56,841 - INFO - Finished converting document 4_2025-03-04 in 0.59 sec.
2025-11-14 15:50:56,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,937 - INFO - Going to convert document batch...
2025-11-14 15:50:56,938 - INFO - Processing document 4_2025-03-14
2025-11-14 15:50:57,007 - INFO - Finished converting document 4_2025-03-14 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-03-04' --> 'data\processed_data\BRK-B\4_2025-03-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-03-14' --> 'data\processed_data\BRK-B\4_2025-03-14.md'


2025-11-14 15:50:57,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,112 - INFO - Going to convert document batch...
2025-11-14 15:50:57,114 - INFO - Processing document 4_2025-03-21
2025-11-14 15:50:57,155 - INFO - Finished converting document 4_2025-03-21 in 0.09 sec.
2025-11-14 15:50:57,234 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:57,235 - ERROR - Input document 4_2025-04-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50

Converted 'data\edgar_documents\BRK-B\4_2025-03-21' --> 'data\processed_data\BRK-B\4_2025-03-21.md'
Error processing data\edgar_documents\BRK-B\4_2025-04-01: File format not allowed: data\edgar_documents\BRK-B\4_2025-04-01


2025-11-14 15:50:57,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,438 - INFO - Going to convert document batch...
2025-11-14 15:50:57,439 - INFO - Processing document 4_2025-04-09
2025-11-14 15:50:57,487 - INFO - Finished converting document 4_2025-04-09 in 0.08 sec.
2025-11-14 15:50:57,569 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:57,571 - ERROR - Input document 4_2025-04-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50

Converted 'data\edgar_documents\BRK-B\4_2025-04-04' --> 'data\processed_data\BRK-B\4_2025-04-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-04-09' --> 'data\processed_data\BRK-B\4_2025-04-09.md'
Error processing data\edgar_documents\BRK-B\4_2025-04-15: File format not allowed: data\edgar_documents\BRK-B\4_2025-04-15


2025-11-14 15:50:57,615 - INFO - Going to convert document batch...
2025-11-14 15:50:57,617 - INFO - Processing document 4_2025-05-12
2025-11-14 15:50:57,679 - INFO - Finished converting document 4_2025-05-12 in 0.09 sec.
2025-11-14 15:50:57,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,776 - INFO - Going to convert document batch...
2025-11-14 15:50:57,778 - INFO - Processing document 4_2025-05-15
2025-11-14 15:50:57,829 - INFO - Finished converting document 4_2025-05-15 in 0.09 sec.
2025-11-14 15:50:57,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-05-12' --> 'data\processed_data\BRK-B\4_2025-05-12.md'
Converted 'data\edgar_documents\BRK-B\4_2025-05-15' --> 'data\processed_data\BRK-B\4_2025-05-15.md'


2025-11-14 15:50:57,938 - INFO - Going to convert document batch...
2025-11-14 15:50:57,939 - INFO - Processing document 4_2025-05-27
2025-11-14 15:50:58,024 - INFO - Finished converting document 4_2025-05-27 in 0.14 sec.
2025-11-14 15:50:58,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,124 - INFO - Going to convert document batch...
2025-11-14 15:50:58,126 - INFO - Processing document 4_2025-06-30
2025-11-14 15:50:58,186 - INFO - Finished converting document 4_2025-06-30 in 0.09 sec.
2025-11-14 15:50:58,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,283 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-05-27' --> 'data\processed_data\BRK-B\4_2025-05-27.md'
Converted 'data\edgar_documents\BRK-B\4_2025-06-30' --> 'data\processed_data\BRK-B\4_2025-06-30.md'


2025-11-14 15:50:58,284 - INFO - Processing document 4_2025-07-16
2025-11-14 15:50:58,341 - INFO - Finished converting document 4_2025-07-16 in 0.11 sec.
2025-11-14 15:50:58,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,442 - INFO - Going to convert document batch...
2025-11-14 15:50:58,443 - INFO - Processing document 4_2025-08-01
2025-11-14 15:50:58,495 - INFO - Finished converting document 4_2025-08-01 in 0.09 sec.
2025-11-14 15:50:58,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,592 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-07-16' --> 'data\processed_data\BRK-B\4_2025-07-16.md'
Converted 'data\edgar_documents\BRK-B\4_2025-08-01' --> 'data\processed_data\BRK-B\4_2025-08-01.md'


2025-11-14 15:50:58,593 - INFO - Processing document 4_2025-08-04
2025-11-14 15:50:58,654 - INFO - Finished converting document 4_2025-08-04 in 0.11 sec.
2025-11-14 15:50:58,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,746 - INFO - Going to convert document batch...
2025-11-14 15:50:58,748 - INFO - Processing document 4_2025-08-08
2025-11-14 15:50:58,806 - INFO - Finished converting document 4_2025-08-08 in 0.09 sec.
2025-11-14 15:50:58,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,901 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-08-04' --> 'data\processed_data\BRK-B\4_2025-08-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-08-08' --> 'data\processed_data\BRK-B\4_2025-08-08.md'


2025-11-14 15:50:58,902 - INFO - Processing document 4_2025-09-26
2025-11-14 15:50:58,979 - INFO - Finished converting document 4_2025-09-26 in 0.12 sec.
2025-11-14 15:50:59,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,081 - INFO - Going to convert document batch...
2025-11-14 15:50:59,082 - INFO - Processing document 4_2025-10-24
2025-11-14 15:50:59,148 - INFO - Finished converting document 4_2025-10-24 in 0.09 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-09-26' --> 'data\processed_data\BRK-B\4_2025-09-26.md'
Converted 'data\edgar_documents\BRK-B\4_2025-10-24' --> 'data\processed_data\BRK-B\4_2025-10-24.md'


2025-11-14 15:50:59,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,269 - INFO - Going to convert document batch...
2025-11-14 15:50:59,271 - INFO - Processing document 4_2025-10-29
2025-11-14 15:50:59,331 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.
2025-11-14 15:50:59,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,436 - INFO - Going to convert document batch...
2025-11-14 15:50:59,438 - INFO - Processing document 4_2025-11-05
2025-11-14 15:50:59,505 - INFO - Finished converting document 4_2025-11-05 in 0.11 sec.
2025-11-14 15:50:59,596 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BRK-B\4_2025-10-29' --> 'data\processed_data\BRK-B\4_2025-10-29.md'
Converted 'data\edgar_documents\BRK-B\4_2025-11-05' --> 'data\processed_data\BRK-B\4_2025-11-05.md'


2025-11-14 15:50:59,596 - ERROR - Input document 4_2025-11-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:59,599 - INFO - Going to convert document batch...
2025-11-14 15:50:59,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,665 - INFO - Going to convert document batch...
2025-11-14 15:50:59,666 - INFO - Processing document 8-K_2023-03-01
2025-11-14 15:50:59,723 - INFO - Finished converting document 8-K_2023-03-01 in 0.12 sec.
2025-11-14 15:50:59,800 - INFO - d

Error processing data\edgar_documents\BRK-B\4_2025-11-06: File format not allowed: data\edgar_documents\BRK-B\4_2025-11-06
Converted 'data\edgar_documents\BRK-B\8-K_2023-03-01' --> 'data\processed_data\BRK-B\8-K_2023-03-01.md'


2025-11-14 15:50:59,834 - INFO - Going to convert document batch...
2025-11-14 15:50:59,835 - INFO - Processing document 8-K_2023-04-20
2025-11-14 15:50:59,887 - INFO - Finished converting document 8-K_2023-04-20 in 0.14 sec.
2025-11-14 15:50:59,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,972 - INFO - Going to convert document batch...
2025-11-14 15:50:59,973 - INFO - Processing document 8-K_2023-05-02
2025-11-14 15:51:00,023 - INFO - Finished converting document 8-K_2023-05-02 in 0.11 sec.
2025-11-14 15:51:00,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2023-04-20' --> 'data\processed_data\BRK-B\8-K_2023-04-20.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-05-02' --> 'data\processed_data\BRK-B\8-K_2023-05-02.md'


2025-11-14 15:51:00,127 - INFO - Going to convert document batch...
2025-11-14 15:51:00,128 - INFO - Processing document 8-K_2023-05-10
2025-11-14 15:51:00,228 - INFO - Finished converting document 8-K_2023-05-10 in 0.17 sec.
2025-11-14 15:51:00,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,315 - INFO - Going to convert document batch...
2025-11-14 15:51:00,316 - INFO - Processing document 8-K_2023-08-07
2025-11-14 15:51:00,369 - INFO - Finished converting document 8-K_2023-08-07 in 0.09 sec.
2025-11-14 15:51:00,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,470 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\8-K_2023-05-10' --> 'data\processed_data\BRK-B\8-K_2023-05-10.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-08-07' --> 'data\processed_data\BRK-B\8-K_2023-08-07.md'


2025-11-14 15:51:00,471 - INFO - Processing document 8-K_2023-11-07
2025-11-14 15:51:00,517 - INFO - Finished converting document 8-K_2023-11-07 in 0.12 sec.
2025-11-14 15:51:00,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,592 - INFO - Going to convert document batch...
2025-11-14 15:51:00,593 - INFO - Processing document 8-K_2023-11-29
2025-11-14 15:51:00,666 - INFO - Finished converting document 8-K_2023-11-29 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\8-K_2023-11-07' --> 'data\processed_data\BRK-B\8-K_2023-11-07.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-11-29' --> 'data\processed_data\BRK-B\8-K_2023-11-29.md'


2025-11-14 15:51:00,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,792 - INFO - Going to convert document batch...
2025-11-14 15:51:00,793 - INFO - Processing document 8-K_2023-12-01
2025-11-14 15:51:00,837 - INFO - Finished converting document 8-K_2023-12-01 in 0.12 sec.
2025-11-14 15:51:00,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,899 - INFO - Going to convert document batch...
2025-11-14 15:51:00,900 - INFO - Processing document 8-K_2024-01-10
2025-11-14 15:51:00,928 - INFO - Finished converting document 8-K_2024-01-10 in 0.06 sec.
2025-11-14 15:51:00,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,983 - INFO - Going to convert document batch...
2025-11-14 15:51:00,984 - INFO - Processing document 8-K_2024-02-26
2025-11-14 15:51:01,015 - INFO - Finished converting document 8-K_2024-02-26 in 0.08 sec.
2025-11-14 15:51:01,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2023-12-01' --> 'data\processed_data\BRK-B\8-K_2023-12-01.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-01-10' --> 'data\processed_data\BRK-B\8-K_2024-01-10.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-02-26' --> 'data\processed_data\BRK-B\8-K_2024-02-26.md'


2025-11-14 15:51:01,066 - INFO - Going to convert document batch...
2025-11-14 15:51:01,068 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:51:01,110 - INFO - Finished converting document 8-K_2024-04-26 in 0.08 sec.
2025-11-14 15:51:01,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,174 - INFO - Going to convert document batch...
2025-11-14 15:51:01,175 - INFO - Processing document 8-K_2024-05-07
2025-11-14 15:51:01,218 - INFO - Finished converting document 8-K_2024-05-07 in 0.09 sec.
2025-11-14 15:51:01,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,266 - INFO - Going to convert document batch...
2025-11-14 15:51:01,266 - INFO - Processing document 8-K_2024-08-05
2025-11-14 15:51:01,289 - INFO - Finished converting document 8-K_2024-08-05 in 0.05 sec.
2025-11-14 15:51:01,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2024-04-26' --> 'data\processed_data\BRK-B\8-K_2024-04-26.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-05-07' --> 'data\processed_data\BRK-B\8-K_2024-05-07.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-08-05' --> 'data\processed_data\BRK-B\8-K_2024-08-05.md'


2025-11-14 15:51:01,334 - INFO - Going to convert document batch...
2025-11-14 15:51:01,334 - INFO - Processing document 8-K_2024-10-23
2025-11-14 15:51:01,366 - INFO - Finished converting document 8-K_2024-10-23 in 0.06 sec.
2025-11-14 15:51:01,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,412 - INFO - Going to convert document batch...
2025-11-14 15:51:01,413 - INFO - Processing document 8-K_2024-11-04
2025-11-14 15:51:01,436 - INFO - Finished converting document 8-K_2024-11-04 in 0.06 sec.
2025-11-14 15:51:01,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,479 - INFO - Going to convert document batch...
2025-11-14 15:51:01,479 - INFO - Processing document 8-K_2025-02-24
2025-11-14 15:51:01,504 - INFO - Finished converting document 8-K_2025-02-24 in 0.05 sec.
2025-11-14 15:51:01,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,549 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BRK-B\8-K_2024-10-23' --> 'data\processed_data\BRK-B\8-K_2024-10-23.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-11-04' --> 'data\processed_data\BRK-B\8-K_2024-11-04.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-02-24' --> 'data\processed_data\BRK-B\8-K_2025-02-24.md'


2025-11-14 15:51:01,578 - INFO - Finished converting document 8-K_2025-04-17 in 0.06 sec.
2025-11-14 15:51:01,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,650 - INFO - Going to convert document batch...
2025-11-14 15:51:01,652 - INFO - Processing document 8-K_2025-05-06
2025-11-14 15:51:01,698 - INFO - Finished converting document 8-K_2025-05-06 in 0.11 sec.
2025-11-14 15:51:01,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2025-04-17' --> 'data\processed_data\BRK-B\8-K_2025-04-17.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-05-06' --> 'data\processed_data\BRK-B\8-K_2025-05-06.md'


2025-11-14 15:51:01,982 - INFO - Going to convert document batch...
2025-11-14 15:51:01,983 - INFO - Processing document 8-K_2025-05-08
2025-11-14 15:51:02,008 - INFO - Finished converting document 8-K_2025-05-08 in 0.28 sec.
2025-11-14 15:51:02,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,060 - INFO - Going to convert document batch...
2025-11-14 15:51:02,061 - INFO - Processing document 8-K_2025-08-04
2025-11-14 15:51:02,091 - INFO - Finished converting document 8-K_2025-08-04 in 0.08 sec.
2025-11-14 15:51:02,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,188 - INFO - Going to convert document batch...
2025-11-14 15:51:02,189 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:51:02,256 - INFO - Finished converting document 8-K_2025-10-03 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\8-K_2025-05-08' --> 'data\processed_data\BRK-B\8-K_2025-05-08.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-08-04' --> 'data\processed_data\BRK-B\8-K_2025-08-04.md'


2025-11-14 15:51:02,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,343 - INFO - Going to convert document batch...
2025-11-14 15:51:02,344 - INFO - Processing document 8-K_2025-11-03
2025-11-14 15:51:02,400 - INFO - Finished converting document 8-K_2025-11-03 in 0.11 sec.
2025-11-14 15:51:02,455 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:51:02,457 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\BRK-B\8-K_2025-10-03' --> 'data\processed_data\BRK-B\8-K_2025-10-03.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-11-03' --> 'data\processed_data\BRK-B\8-K_2025-11-03.md'
Error processing data\edgar_documents\BRK-B\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2023-03-17


2025-11-14 15:51:02,485 - ERROR - Input document DEF-14A_2024-03-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:51:02,488 - INFO - Going to convert document batch...
2025-11-14 15:51:02,512 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:51:02,513 - ERROR - Input document DEF-14A_2025-03-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\BRK-B\DEF-14A_2024-03-15: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2024-03-15
Error processing data\edgar_documents\BRK-B\DEF-14A_2025-03-14: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2025-03-14
Processed 144 new files. Errors: 13
Found 165 files to process in data\edgar_documents\CAT


2025-11-14 15:51:06,792 - INFO - Going to convert document batch...
2025-11-14 15:51:06,795 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:51:06,796 - INFO - Processing document 10-K_2023-02-15
2025-11-14 15:51:17,096 - INFO - Finished converting document 10-K_2023-02-15 in 14.56 sec.
2025-11-14 15:51:19,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2023-02-15' --> 'data\processed_data\CAT\10-K_2023-02-15.md'


2025-11-14 15:51:23,561 - INFO - Going to convert document batch...
2025-11-14 15:51:23,563 - INFO - Processing document 10-K_2024-02-16
2025-11-14 15:51:33,378 - INFO - Finished converting document 10-K_2024-02-16 in 13.75 sec.
2025-11-14 15:51:38,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2024-02-16' --> 'data\processed_data\CAT\10-K_2024-02-16.md'


2025-11-14 15:51:42,369 - INFO - Going to convert document batch...
2025-11-14 15:51:42,370 - INFO - Processing document 10-K_2025-02-14
2025-11-14 15:51:52,404 - INFO - Finished converting document 10-K_2025-02-14 in 14.48 sec.
2025-11-14 15:51:55,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2025-02-14' --> 'data\processed_data\CAT\10-K_2025-02-14.md'


2025-11-14 15:51:58,464 - INFO - Going to convert document batch...
2025-11-14 15:51:58,465 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 15:52:02,550 - INFO - Finished converting document 10-Q_2023-05-03 in 7.31 sec.
2025-11-14 15:52:04,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-05-03' --> 'data\processed_data\CAT\10-Q_2023-05-03.md'


2025-11-14 15:52:08,211 - INFO - Going to convert document batch...
2025-11-14 15:52:08,212 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:52:13,357 - INFO - Finished converting document 10-Q_2023-08-02 in 8.98 sec.
2025-11-14 15:52:15,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-08-02' --> 'data\processed_data\CAT\10-Q_2023-08-02.md'


2025-11-14 15:52:18,343 - INFO - Going to convert document batch...
2025-11-14 15:52:18,344 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:52:22,117 - INFO - Finished converting document 10-Q_2023-11-01 in 6.39 sec.
2025-11-14 15:52:25,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-11-01' --> 'data\processed_data\CAT\10-Q_2023-11-01.md'


2025-11-14 15:52:28,084 - INFO - Going to convert document batch...
2025-11-14 15:52:28,086 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:52:33,577 - INFO - Finished converting document 10-Q_2024-05-01 in 8.09 sec.
2025-11-14 15:52:35,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-05-01' --> 'data\processed_data\CAT\10-Q_2024-05-01.md'


2025-11-14 15:52:38,258 - INFO - Going to convert document batch...
2025-11-14 15:52:38,259 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:52:44,815 - INFO - Finished converting document 10-Q_2024-08-07 in 9.36 sec.
2025-11-14 15:52:47,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-08-07' --> 'data\processed_data\CAT\10-Q_2024-08-07.md'


2025-11-14 15:52:50,982 - INFO - Going to convert document batch...
2025-11-14 15:52:50,983 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 15:52:56,817 - INFO - Finished converting document 10-Q_2024-11-06 in 9.59 sec.
2025-11-14 15:52:59,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-11-06' --> 'data\processed_data\CAT\10-Q_2024-11-06.md'


2025-11-14 15:53:02,745 - INFO - Going to convert document batch...
2025-11-14 15:53:02,747 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:53:06,971 - INFO - Finished converting document 10-Q_2025-05-07 in 7.50 sec.
2025-11-14 15:53:09,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-05-07' --> 'data\processed_data\CAT\10-Q_2025-05-07.md'


2025-11-14 15:53:13,206 - INFO - Going to convert document batch...
2025-11-14 15:53:13,208 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:53:19,134 - INFO - Finished converting document 10-Q_2025-08-06 in 10.06 sec.
2025-11-14 15:53:21,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-08-06' --> 'data\processed_data\CAT\10-Q_2025-08-06.md'


2025-11-14 15:53:25,469 - INFO - Going to convert document batch...
2025-11-14 15:53:25,470 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 15:53:31,809 - INFO - Finished converting document 10-Q_2025-11-03 in 10.16 sec.
2025-11-14 15:53:34,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,403 - INFO - Going to convert document batch...
2025-11-14 15:53:34,404 - INFO - Processing document 4_2023-01-03
2025-11-14 15:53:34,448 - INFO - Finished converting document 4_2023-01-03 in 0.09 sec.
2025-11-14 15:53:34,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-11-03' --> 'data\processed_data\CAT\10-Q_2025-11-03.md'
Converted 'data\edgar_documents\CAT\4_2023-01-03' --> 'data\processed_data\CAT\4_2023-01-03.md'


2025-11-14 15:53:34,561 - INFO - Going to convert document batch...
2025-11-14 15:53:34,563 - INFO - Processing document 4_2023-01-09
2025-11-14 15:53:34,614 - INFO - Finished converting document 4_2023-01-09 in 0.09 sec.
2025-11-14 15:53:34,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,697 - INFO - Going to convert document batch...
2025-11-14 15:53:34,700 - INFO - Processing document 4_2023-01-10
2025-11-14 15:53:34,779 - INFO - Finished converting document 4_2023-01-10 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2023-01-09' --> 'data\processed_data\CAT\4_2023-01-09.md'
Converted 'data\edgar_documents\CAT\4_2023-01-10' --> 'data\processed_data\CAT\4_2023-01-10.md'


2025-11-14 15:53:34,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,909 - INFO - Going to convert document batch...
2025-11-14 15:53:34,910 - INFO - Processing document 4_2023-02-06
2025-11-14 15:53:35,013 - INFO - Finished converting document 4_2023-02-06 in 0.17 sec.
2025-11-14 15:53:35,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,110 - INFO - Going to convert document batch...
2025-11-14 15:53:35,112 - INFO - Processing document 4_2023-02-07
2025-11-14 15:53:35,158 - INFO - Finished converting document 4_2023-02-07 in 0.08 sec.
2025-11-14 15:53:35,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,253 - INFO - Going to convert document batch...
2025-11-14 15:53:35,255 - INFO - Processing document 4_2023-02-08


Converted 'data\edgar_documents\CAT\4_2023-02-06' --> 'data\processed_data\CAT\4_2023-02-06.md'
Converted 'data\edgar_documents\CAT\4_2023-02-07' --> 'data\processed_data\CAT\4_2023-02-07.md'


2025-11-14 15:53:35,293 - INFO - Finished converting document 4_2023-02-08 in 0.09 sec.
2025-11-14 15:53:35,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,373 - INFO - Going to convert document batch...
2025-11-14 15:53:35,374 - INFO - Processing document 4_2023-02-10
2025-11-14 15:53:35,415 - INFO - Finished converting document 4_2023-02-10 in 0.06 sec.
2025-11-14 15:53:35,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,502 - INFO - Going to convert document batch...
2025-11-14 15:53:35,504 - INFO - Processing document 4_2023-02-21


Converted 'data\edgar_documents\CAT\4_2023-02-08' --> 'data\processed_data\CAT\4_2023-02-08.md'
Converted 'data\edgar_documents\CAT\4_2023-02-10' --> 'data\processed_data\CAT\4_2023-02-10.md'


2025-11-14 15:53:35,564 - INFO - Finished converting document 4_2023-02-21 in 0.11 sec.
2025-11-14 15:53:35,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,648 - INFO - Going to convert document batch...
2025-11-14 15:53:35,649 - INFO - Processing document 4_2023-03-06
2025-11-14 15:53:35,696 - INFO - Finished converting document 4_2023-03-06 in 0.08 sec.
2025-11-14 15:53:35,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,774 - INFO - Going to convert document batch...
2025-11-14 15:53:35,775 - INFO - Processing document 4_2023-03-08


Converted 'data\edgar_documents\CAT\4_2023-02-21' --> 'data\processed_data\CAT\4_2023-02-21.md'
Converted 'data\edgar_documents\CAT\4_2023-03-06' --> 'data\processed_data\CAT\4_2023-03-06.md'


2025-11-14 15:53:35,815 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:53:35,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,899 - INFO - Going to convert document batch...
2025-11-14 15:53:35,900 - INFO - Processing document 4_2023-03-14
2025-11-14 15:53:35,945 - INFO - Finished converting document 4_2023-03-14 in 0.08 sec.
2025-11-14 15:53:36,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-03-08' --> 'data\processed_data\CAT\4_2023-03-08.md'
Converted 'data\edgar_documents\CAT\4_2023-03-14' --> 'data\processed_data\CAT\4_2023-03-14.md'


2025-11-14 15:53:36,058 - INFO - Going to convert document batch...
2025-11-14 15:53:36,066 - INFO - Processing document 4_2023-03-16
2025-11-14 15:53:36,115 - INFO - Finished converting document 4_2023-03-16 in 0.11 sec.
2025-11-14 15:53:36,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,211 - INFO - Going to convert document batch...
2025-11-14 15:53:36,212 - INFO - Processing document 4_2023-04-04
2025-11-14 15:53:36,260 - INFO - Finished converting document 4_2023-04-04 in 0.11 sec.
2025-11-14 15:53:36,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-03-16' --> 'data\processed_data\CAT\4_2023-03-16.md'
Converted 'data\edgar_documents\CAT\4_2023-04-04' --> 'data\processed_data\CAT\4_2023-04-04.md'


2025-11-14 15:53:36,355 - INFO - Going to convert document batch...
2025-11-14 15:53:36,357 - INFO - Processing document 4_2023-05-31
2025-11-14 15:53:36,414 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.
2025-11-14 15:53:36,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,519 - INFO - Going to convert document batch...
2025-11-14 15:53:36,520 - INFO - Processing document 4_2023-06-09
2025-11-14 15:53:36,570 - INFO - Finished converting document 4_2023-06-09 in 0.08 sec.
2025-11-14 15:53:36,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,664 - INFO - Going to convert document batch...
2025-11-14 15:53:36,666 - INFO - Processing document 4_2023-06-15


Converted 'data\edgar_documents\CAT\4_2023-05-31' --> 'data\processed_data\CAT\4_2023-05-31.md'
Converted 'data\edgar_documents\CAT\4_2023-06-09' --> 'data\processed_data\CAT\4_2023-06-09.md'


2025-11-14 15:53:36,709 - INFO - Finished converting document 4_2023-06-15 in 0.08 sec.
2025-11-14 15:53:36,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,803 - INFO - Going to convert document batch...
2025-11-14 15:53:36,804 - INFO - Processing document 4_2023-06-27
2025-11-14 15:53:36,850 - INFO - Finished converting document 4_2023-06-27 in 0.08 sec.
2025-11-14 15:53:36,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-06-15' --> 'data\processed_data\CAT\4_2023-06-15.md'
Converted 'data\edgar_documents\CAT\4_2023-06-27' --> 'data\processed_data\CAT\4_2023-06-27.md'


2025-11-14 15:53:36,963 - INFO - Going to convert document batch...
2025-11-14 15:53:36,965 - INFO - Processing document 4_2023-07-03
2025-11-14 15:53:37,022 - INFO - Finished converting document 4_2023-07-03 in 0.11 sec.
2025-11-14 15:53:37,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,159 - INFO - Going to convert document batch...
2025-11-14 15:53:37,160 - INFO - Processing document 4_2023-07-19
2025-11-14 15:53:37,215 - INFO - Finished converting document 4_2023-07-19 in 0.11 sec.
2025-11-14 15:53:37,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-07-03' --> 'data\processed_data\CAT\4_2023-07-03.md'
Converted 'data\edgar_documents\CAT\4_2023-07-19' --> 'data\processed_data\CAT\4_2023-07-19.md'


2025-11-14 15:53:37,322 - INFO - Going to convert document batch...
2025-11-14 15:53:37,325 - INFO - Processing document 4_2023-07-28
2025-11-14 15:53:37,371 - INFO - Finished converting document 4_2023-07-28 in 0.11 sec.
2025-11-14 15:53:37,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,452 - INFO - Going to convert document batch...
2025-11-14 15:53:37,454 - INFO - Processing document 4_2023-08-02
2025-11-14 15:53:37,506 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.
2025-11-14 15:53:37,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,616 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-07-28' --> 'data\processed_data\CAT\4_2023-07-28.md'
Converted 'data\edgar_documents\CAT\4_2023-08-02' --> 'data\processed_data\CAT\4_2023-08-02.md'


2025-11-14 15:53:37,618 - INFO - Processing document 4_2023-08-03
2025-11-14 15:53:37,686 - INFO - Finished converting document 4_2023-08-03 in 0.14 sec.
2025-11-14 15:53:37,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,787 - INFO - Going to convert document batch...
2025-11-14 15:53:37,788 - INFO - Processing document 4_2023-08-04
2025-11-14 15:53:37,856 - INFO - Finished converting document 4_2023-08-04 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2023-08-03' --> 'data\processed_data\CAT\4_2023-08-03.md'
Converted 'data\edgar_documents\CAT\4_2023-08-04' --> 'data\processed_data\CAT\4_2023-08-04.md'


2025-11-14 15:53:37,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,978 - INFO - Going to convert document batch...
2025-11-14 15:53:37,979 - INFO - Processing document 4_2023-08-07
2025-11-14 15:53:38,035 - INFO - Finished converting document 4_2023-08-07 in 0.11 sec.
2025-11-14 15:53:38,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,119 - INFO - Going to convert document batch...
2025-11-14 15:53:38,120 - INFO - Processing document 4_2023-08-08
2025-11-14 15:53:38,158 - INFO - Finished converting document 4_2023-08-08 in 0.08 sec.
2025-11-14 15:53:38,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,228 - INFO - Going to convert document batch...
2025-11-14 15:53:38,229 - INFO - Processing document 4_2023-08-10
2025-11-14 15:53:38,285 - INFO - Finished converting document 4_2023-08-10 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2023-08-07' --> 'data\processed_data\CAT\4_2023-08-07.md'
Converted 'data\edgar_documents\CAT\4_2023-08-08' --> 'data\processed_data\CAT\4_2023-08-08.md'


2025-11-14 15:53:38,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,371 - INFO - Going to convert document batch...
2025-11-14 15:53:38,372 - INFO - Processing document 4_2023-08-28
2025-11-14 15:53:38,419 - INFO - Finished converting document 4_2023-08-28 in 0.08 sec.
2025-11-14 15:53:38,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,537 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-08-10' --> 'data\processed_data\CAT\4_2023-08-10.md'
Converted 'data\edgar_documents\CAT\4_2023-08-28' --> 'data\processed_data\CAT\4_2023-08-28.md'


2025-11-14 15:53:38,539 - INFO - Processing document 4_2023-08-31
2025-11-14 15:53:38,612 - INFO - Finished converting document 4_2023-08-31 in 0.14 sec.
2025-11-14 15:53:38,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,705 - INFO - Going to convert document batch...
2025-11-14 15:53:38,707 - INFO - Processing document 4_2023-09-05
2025-11-14 15:53:38,752 - INFO - Finished converting document 4_2023-09-05 in 0.08 sec.
2025-11-14 15:53:38,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-08-31' --> 'data\processed_data\CAT\4_2023-08-31.md'
Converted 'data\edgar_documents\CAT\4_2023-09-05' --> 'data\processed_data\CAT\4_2023-09-05.md'


2025-11-14 15:53:38,864 - INFO - Processing document 4_2023-09-27
2025-11-14 15:53:38,916 - INFO - Finished converting document 4_2023-09-27 in 0.11 sec.
2025-11-14 15:53:38,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,019 - INFO - Going to convert document batch...
2025-11-14 15:53:39,022 - INFO - Processing document 4_2023-10-02
2025-11-14 15:53:39,084 - INFO - Finished converting document 4_2023-10-02 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2023-09-27' --> 'data\processed_data\CAT\4_2023-09-27.md'
Converted 'data\edgar_documents\CAT\4_2023-10-02' --> 'data\processed_data\CAT\4_2023-10-02.md'


2025-11-14 15:53:39,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,203 - INFO - Going to convert document batch...
2025-11-14 15:53:39,205 - INFO - Processing document 4_2023-10-27
2025-11-14 15:53:39,253 - INFO - Finished converting document 4_2023-10-27 in 0.11 sec.
2025-11-14 15:53:39,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,385 - INFO - Going to convert document batch...
2025-11-14 15:53:39,388 - INFO - Processing document 4_2023-11-27
2025-11-14 15:53:39,434 - INFO - Finished converting document 4_2023-11-27 in 0.11 sec.
2025-11-14 15:53:39,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,526 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-10-27' --> 'data\processed_data\CAT\4_2023-10-27.md'
Converted 'data\edgar_documents\CAT\4_2023-11-27' --> 'data\processed_data\CAT\4_2023-11-27.md'


2025-11-14 15:53:39,527 - INFO - Processing document 4_2023-12-19
2025-11-14 15:53:39,592 - INFO - Finished converting document 4_2023-12-19 in 0.11 sec.
2025-11-14 15:53:39,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,674 - INFO - Going to convert document batch...
2025-11-14 15:53:39,676 - INFO - Processing document 4_2023-12-27
2025-11-14 15:53:39,717 - INFO - Finished converting document 4_2023-12-27 in 0.08 sec.
2025-11-14 15:53:39,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,820 - INFO - Going to convert document batch...
2025-11-14 15:53:39,822 - INFO - Processing document 4_2024-01-02


Converted 'data\edgar_documents\CAT\4_2023-12-19' --> 'data\processed_data\CAT\4_2023-12-19.md'
Converted 'data\edgar_documents\CAT\4_2023-12-27' --> 'data\processed_data\CAT\4_2023-12-27.md'


2025-11-14 15:53:39,888 - INFO - Finished converting document 4_2024-01-02 in 0.12 sec.
2025-11-14 15:53:39,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,990 - INFO - Going to convert document batch...
2025-11-14 15:53:39,992 - INFO - Processing document 4_2024-01-16
2025-11-14 15:53:40,031 - INFO - Finished converting document 4_2024-01-16 in 0.08 sec.
2025-11-14 15:53:40,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,121 - INFO - Going to convert document batch...
2025-11-14 15:53:40,123 - INFO - Processing document 4_2024-01-26
2025-11-14 15:53:40,162 - INFO - Finished converting document 4_2024-01-26 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2024-01-02' --> 'data\processed_data\CAT\4_2024-01-02.md'
Converted 'data\edgar_documents\CAT\4_2024-01-16' --> 'data\processed_data\CAT\4_2024-01-16.md'


2025-11-14 15:53:40,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,241 - INFO - Going to convert document batch...
2025-11-14 15:53:40,242 - INFO - Processing document 4_2024-02-06
2025-11-14 15:53:40,298 - INFO - Finished converting document 4_2024-02-06 in 0.09 sec.
2025-11-14 15:53:40,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,403 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-01-26' --> 'data\processed_data\CAT\4_2024-01-26.md'
Converted 'data\edgar_documents\CAT\4_2024-02-06' --> 'data\processed_data\CAT\4_2024-02-06.md'


2025-11-14 15:53:40,404 - INFO - Processing document 4_2024-02-08
2025-11-14 15:53:40,462 - INFO - Finished converting document 4_2024-02-08 in 0.11 sec.
2025-11-14 15:53:40,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,549 - INFO - Going to convert document batch...
2025-11-14 15:53:40,551 - INFO - Processing document 4_2024-02-15
2025-11-14 15:53:40,600 - INFO - Finished converting document 4_2024-02-15 in 0.08 sec.
2025-11-14 15:53:40,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,694 - INFO - Going to convert document batch...
2025-11-14 15:53:40,696 - INFO - Processing document 4_2024-02-16


Converted 'data\edgar_documents\CAT\4_2024-02-08' --> 'data\processed_data\CAT\4_2024-02-08.md'
Converted 'data\edgar_documents\CAT\4_2024-02-15' --> 'data\processed_data\CAT\4_2024-02-15.md'


2025-11-14 15:53:40,757 - INFO - Finished converting document 4_2024-02-16 in 0.11 sec.
2025-11-14 15:53:40,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,852 - INFO - Going to convert document batch...
2025-11-14 15:53:40,853 - INFO - Processing document 4_2024-02-23
2025-11-14 15:53:40,901 - INFO - Finished converting document 4_2024-02-23 in 0.09 sec.
2025-11-14 15:53:40,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,012 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-02-16' --> 'data\processed_data\CAT\4_2024-02-16.md'
Converted 'data\edgar_documents\CAT\4_2024-02-23' --> 'data\processed_data\CAT\4_2024-02-23.md'


2025-11-14 15:53:41,013 - INFO - Processing document 4_2024-02-26
2025-11-14 15:53:41,072 - INFO - Finished converting document 4_2024-02-26 in 0.08 sec.
2025-11-14 15:53:41,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,181 - INFO - Going to convert document batch...
2025-11-14 15:53:41,182 - INFO - Processing document 4_2024-02-27
2025-11-14 15:53:41,235 - INFO - Finished converting document 4_2024-02-27 in 0.09 sec.
2025-11-14 15:53:41,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,333 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-02-26' --> 'data\processed_data\CAT\4_2024-02-26.md'
Converted 'data\edgar_documents\CAT\4_2024-02-27' --> 'data\processed_data\CAT\4_2024-02-27.md'


2025-11-14 15:53:41,335 - INFO - Processing document 4_2024-02-29
2025-11-14 15:53:41,394 - INFO - Finished converting document 4_2024-02-29 in 0.11 sec.
2025-11-14 15:53:41,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,500 - INFO - Going to convert document batch...
2025-11-14 15:53:41,501 - INFO - Processing document 4_2024-03-05
2025-11-14 15:53:41,552 - INFO - Finished converting document 4_2024-03-05 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2024-02-29' --> 'data\processed_data\CAT\4_2024-02-29.md'
Converted 'data\edgar_documents\CAT\4_2024-03-05' --> 'data\processed_data\CAT\4_2024-03-05.md'


2025-11-14 15:53:41,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,645 - INFO - Going to convert document batch...
2025-11-14 15:53:41,646 - INFO - Processing document 4_2024-03-06
2025-11-14 15:53:41,717 - INFO - Finished converting document 4_2024-03-06 in 0.12 sec.
2025-11-14 15:53:41,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,821 - INFO - Going to convert document batch...
2025-11-14 15:53:41,823 - INFO - Processing document 4_2024-03-08
2025-11-14 15:53:41,894 - INFO - Finished converting document 4_2024-03-08 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2024-03-06' --> 'data\processed_data\CAT\4_2024-03-06.md'
Converted 'data\edgar_documents\CAT\4_2024-03-08' --> 'data\processed_data\CAT\4_2024-03-08.md'


2025-11-14 15:53:41,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,006 - INFO - Going to convert document batch...
2025-11-14 15:53:42,008 - INFO - Processing document 4_2024-03-12
2025-11-14 15:53:42,082 - INFO - Finished converting document 4_2024-03-12 in 0.12 sec.
2025-11-14 15:53:42,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,160 - INFO - Going to convert document batch...
2025-11-14 15:53:42,161 - INFO - Processing document 4_2024-03-18
2025-11-14 15:53:42,214 - INFO - Finished converting document 4_2024-03-18 in 0.09 sec.
2025-11-14 15:53:42,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,305 - INFO - Going to convert document batch...
2025-11-14 15:53:42,306 - INFO - Processing document 4_2024-04-01


Converted 'data\edgar_documents\CAT\4_2024-03-12' --> 'data\processed_data\CAT\4_2024-03-12.md'
Converted 'data\edgar_documents\CAT\4_2024-03-18' --> 'data\processed_data\CAT\4_2024-03-18.md'


2025-11-14 15:53:42,361 - INFO - Finished converting document 4_2024-04-01 in 0.09 sec.
2025-11-14 15:53:42,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,479 - INFO - Going to convert document batch...
2025-11-14 15:53:42,481 - INFO - Processing document 4_2024-04-02
2025-11-14 15:53:42,532 - INFO - Finished converting document 4_2024-04-02 in 0.11 sec.
2025-11-14 15:53:42,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,616 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-04-01' --> 'data\processed_data\CAT\4_2024-04-01.md'
Converted 'data\edgar_documents\CAT\4_2024-04-02' --> 'data\processed_data\CAT\4_2024-04-02.md'


2025-11-14 15:53:42,617 - INFO - Processing document 4_2024-04-29
2025-11-14 15:53:42,666 - INFO - Finished converting document 4_2024-04-29 in 0.08 sec.
2025-11-14 15:53:42,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,755 - INFO - Going to convert document batch...
2025-11-14 15:53:42,756 - INFO - Processing document 4_2024-04-30
2025-11-14 15:53:42,800 - INFO - Finished converting document 4_2024-04-30 in 0.08 sec.
2025-11-14 15:53:42,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,890 - INFO - Going to convert document batch...
2025-11-14 15:53:42,891 - INFO - Processing document 4_2024-05-02


Converted 'data\edgar_documents\CAT\4_2024-04-29' --> 'data\processed_data\CAT\4_2024-04-29.md'
Converted 'data\edgar_documents\CAT\4_2024-04-30' --> 'data\processed_data\CAT\4_2024-04-30.md'


2025-11-14 15:53:42,936 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 15:53:42,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,018 - INFO - Going to convert document batch...
2025-11-14 15:53:43,019 - INFO - Processing document 4_2024-05-06
2025-11-14 15:53:43,068 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.
2025-11-14 15:53:43,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,157 - INFO - Going to convert document batch...
2025-11-14 15:53:43,160 - INFO - Processing document 4_2024-05-07


Converted 'data\edgar_documents\CAT\4_2024-05-02' --> 'data\processed_data\CAT\4_2024-05-02.md'
Converted 'data\edgar_documents\CAT\4_2024-05-06' --> 'data\processed_data\CAT\4_2024-05-06.md'


2025-11-14 15:53:43,210 - INFO - Finished converting document 4_2024-05-07 in 0.09 sec.
2025-11-14 15:53:43,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,304 - INFO - Going to convert document batch...
2025-11-14 15:53:43,305 - INFO - Processing document 4_2024-05-08
2025-11-14 15:53:43,362 - INFO - Finished converting document 4_2024-05-08 in 0.09 sec.
2025-11-14 15:53:43,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,465 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-05-07' --> 'data\processed_data\CAT\4_2024-05-07.md'
Converted 'data\edgar_documents\CAT\4_2024-05-08' --> 'data\processed_data\CAT\4_2024-05-08.md'


2025-11-14 15:53:43,466 - INFO - Processing document 4_2024-05-14
2025-11-14 15:53:43,524 - INFO - Finished converting document 4_2024-05-14 in 0.11 sec.
2025-11-14 15:53:43,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,606 - INFO - Going to convert document batch...
2025-11-14 15:53:43,607 - INFO - Processing document 4_2024-05-22
2025-11-14 15:53:43,675 - INFO - Finished converting document 4_2024-05-22 in 0.09 sec.
2025-11-14 15:53:43,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,767 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-05-14' --> 'data\processed_data\CAT\4_2024-05-14.md'
Converted 'data\edgar_documents\CAT\4_2024-05-22' --> 'data\processed_data\CAT\4_2024-05-22.md'


2025-11-14 15:53:43,769 - INFO - Processing document 4_2024-05-28
2025-11-14 15:53:43,814 - INFO - Finished converting document 4_2024-05-28 in 0.09 sec.
2025-11-14 15:53:43,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,885 - INFO - Going to convert document batch...
2025-11-14 15:53:43,887 - INFO - Processing document 4_2024-05-31
2025-11-14 15:53:43,925 - INFO - Finished converting document 4_2024-05-31 in 0.06 sec.
2025-11-14 15:53:43,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,005 - INFO - Going to convert document batch...
2025-11-14 15:53:44,006 - INFO - Processing document 4_2024-06-13
2025-11-14 15:53:44,046 - INFO - Finished converting document 4_2024-06-13 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2024-05-28' --> 'data\processed_data\CAT\4_2024-05-28.md'
Converted 'data\edgar_documents\CAT\4_2024-05-31' --> 'data\processed_data\CAT\4_2024-05-31.md'


2025-11-14 15:53:44,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,138 - INFO - Going to convert document batch...
2025-11-14 15:53:44,140 - INFO - Processing document 4_2024-06-27
2025-11-14 15:53:44,191 - INFO - Finished converting document 4_2024-06-27 in 0.08 sec.
2025-11-14 15:53:44,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,273 - INFO - Going to convert document batch...
2025-11-14 15:53:44,274 - INFO - Processing document 4_2024-07-01
2025-11-14 15:53:44,318 - INFO - Finished converting document 4_2024-07-01 in 0.08 sec.


Converted 'data\edgar_documents\CAT\4_2024-06-13' --> 'data\processed_data\CAT\4_2024-06-13.md'
Converted 'data\edgar_documents\CAT\4_2024-06-27' --> 'data\processed_data\CAT\4_2024-06-27.md'


2025-11-14 15:53:44,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,399 - INFO - Going to convert document batch...
2025-11-14 15:53:44,401 - INFO - Processing document 4_2024-07-17
2025-11-14 15:53:44,493 - INFO - Finished converting document 4_2024-07-17 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2024-07-01' --> 'data\processed_data\CAT\4_2024-07-01.md'
Converted 'data\edgar_documents\CAT\4_2024-07-17' --> 'data\processed_data\CAT\4_2024-07-17.md'


2025-11-14 15:53:44,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,601 - INFO - Going to convert document batch...
2025-11-14 15:53:44,603 - INFO - Processing document 4_2024-07-29
2025-11-14 15:53:44,654 - INFO - Finished converting document 4_2024-07-29 in 0.11 sec.
2025-11-14 15:53:44,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,736 - INFO - Going to convert document batch...
2025-11-14 15:53:44,738 - INFO - Processing document 4_2024-08-23
2025-11-14 15:53:44,783 - INFO - Finished converting document 4_2024-08-23 in 0.08 sec.
2025-11-14 15:53:44,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,886 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-07-29' --> 'data\processed_data\CAT\4_2024-07-29.md'
Converted 'data\edgar_documents\CAT\4_2024-08-23' --> 'data\processed_data\CAT\4_2024-08-23.md'


2025-11-14 15:53:44,887 - INFO - Processing document 4_2024-08-27
2025-11-14 15:53:44,946 - INFO - Finished converting document 4_2024-08-27 in 0.09 sec.
2025-11-14 15:53:45,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,036 - INFO - Going to convert document batch...
2025-11-14 15:53:45,037 - INFO - Processing document 4_2024-09-03
2025-11-14 15:53:45,102 - INFO - Finished converting document 4_2024-09-03 in 0.09 sec.
2025-11-14 15:53:45,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,194 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-08-27' --> 'data\processed_data\CAT\4_2024-08-27.md'
Converted 'data\edgar_documents\CAT\4_2024-09-03' --> 'data\processed_data\CAT\4_2024-09-03.md'


2025-11-14 15:53:45,196 - INFO - Processing document 4_2024-09-05
2025-11-14 15:53:45,240 - INFO - Finished converting document 4_2024-09-05 in 0.08 sec.
2025-11-14 15:53:45,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,322 - INFO - Going to convert document batch...
2025-11-14 15:53:45,324 - INFO - Processing document 4_2024-09-27
2025-11-14 15:53:45,373 - INFO - Finished converting document 4_2024-09-27 in 0.09 sec.
2025-11-14 15:53:45,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-09-05' --> 'data\processed_data\CAT\4_2024-09-05.md'
Converted 'data\edgar_documents\CAT\4_2024-09-27' --> 'data\processed_data\CAT\4_2024-09-27.md'


2025-11-14 15:53:45,470 - INFO - Going to convert document batch...
2025-11-14 15:53:45,472 - INFO - Processing document 4_2024-10-01
2025-11-14 15:53:45,523 - INFO - Finished converting document 4_2024-10-01 in 0.09 sec.
2025-11-14 15:53:45,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,605 - INFO - Going to convert document batch...
2025-11-14 15:53:45,607 - INFO - Processing document 4_2024-10-28
2025-11-14 15:53:45,660 - INFO - Finished converting document 4_2024-10-28 in 0.09 sec.
2025-11-14 15:53:45,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-10-01' --> 'data\processed_data\CAT\4_2024-10-01.md'
Converted 'data\edgar_documents\CAT\4_2024-10-28' --> 'data\processed_data\CAT\4_2024-10-28.md'


2025-11-14 15:53:45,768 - INFO - Going to convert document batch...
2025-11-14 15:53:45,771 - INFO - Processing document 4_2024-11-04
2025-11-14 15:53:45,831 - INFO - Finished converting document 4_2024-11-04 in 0.11 sec.
2025-11-14 15:53:45,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,928 - INFO - Going to convert document batch...
2025-11-14 15:53:45,929 - INFO - Processing document 4_2024-11-05
2025-11-14 15:53:45,973 - INFO - Finished converting document 4_2024-11-05 in 0.08 sec.
2025-11-14 15:53:46,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,065 - INFO - Going to convert document batch...
2025-11-14 15:53:46,066 - INFO - Processing document 4_2024-11-07
2025-11-14 15:53:46,130 - INFO - Finished converting document 4_2024-11-07 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2024-11-04' --> 'data\processed_data\CAT\4_2024-11-04.md'
Converted 'data\edgar_documents\CAT\4_2024-11-05' --> 'data\processed_data\CAT\4_2024-11-05.md'


2025-11-14 15:53:46,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,229 - INFO - Going to convert document batch...
2025-11-14 15:53:46,230 - INFO - Processing document 4_2024-11-08
2025-11-14 15:53:46,307 - INFO - Finished converting document 4_2024-11-08 in 0.12 sec.
2025-11-14 15:53:46,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-11-07' --> 'data\processed_data\CAT\4_2024-11-07.md'
Converted 'data\edgar_documents\CAT\4_2024-11-08' --> 'data\processed_data\CAT\4_2024-11-08.md'


2025-11-14 15:53:46,404 - INFO - Going to convert document batch...
2025-11-14 15:53:46,405 - INFO - Processing document 4_2024-11-18
2025-11-14 15:53:46,462 - INFO - Finished converting document 4_2024-11-18 in 0.11 sec.
2025-11-14 15:53:46,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,561 - INFO - Going to convert document batch...
2025-11-14 15:53:46,562 - INFO - Processing document 4_2024-11-26
2025-11-14 15:53:46,616 - INFO - Finished converting document 4_2024-11-26 in 0.09 sec.
2025-11-14 15:53:46,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,718 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-11-18' --> 'data\processed_data\CAT\4_2024-11-18.md'
Converted 'data\edgar_documents\CAT\4_2024-11-26' --> 'data\processed_data\CAT\4_2024-11-26.md'


2025-11-14 15:53:46,719 - INFO - Processing document 4_2024-11-27
2025-11-14 15:53:46,780 - INFO - Finished converting document 4_2024-11-27 in 0.11 sec.
2025-11-14 15:53:46,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,901 - INFO - Going to convert document batch...
2025-11-14 15:53:46,903 - INFO - Processing document 4_2024-12-02
2025-11-14 15:53:46,993 - INFO - Finished converting document 4_2024-12-02 in 0.16 sec.


Converted 'data\edgar_documents\CAT\4_2024-11-27' --> 'data\processed_data\CAT\4_2024-11-27.md'


2025-11-14 15:53:47,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,101 - INFO - Going to convert document batch...
2025-11-14 15:53:47,102 - INFO - Processing document 4_2024-12-03
2025-11-14 15:53:47,142 - INFO - Finished converting document 4_2024-12-03 in 0.08 sec.
2025-11-14 15:53:47,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,243 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-12-02' --> 'data\processed_data\CAT\4_2024-12-02.md'
Converted 'data\edgar_documents\CAT\4_2024-12-03' --> 'data\processed_data\CAT\4_2024-12-03.md'


2025-11-14 15:53:47,245 - INFO - Processing document 4_2024-12-05
2025-11-14 15:53:47,279 - INFO - Finished converting document 4_2024-12-05 in 0.09 sec.
2025-11-14 15:53:47,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,361 - INFO - Going to convert document batch...
2025-11-14 15:53:47,363 - INFO - Processing document 4_2024-12-06
2025-11-14 15:53:47,414 - INFO - Finished converting document 4_2024-12-06 in 0.09 sec.
2025-11-14 15:53:47,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-12-05' --> 'data\processed_data\CAT\4_2024-12-05.md'
Converted 'data\edgar_documents\CAT\4_2024-12-06' --> 'data\processed_data\CAT\4_2024-12-06.md'


2025-11-14 15:53:47,526 - INFO - Going to convert document batch...
2025-11-14 15:53:47,527 - INFO - Processing document 4_2024-12-27
2025-11-14 15:53:47,581 - INFO - Finished converting document 4_2024-12-27 in 0.11 sec.
2025-11-14 15:53:47,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,662 - INFO - Going to convert document batch...
2025-11-14 15:53:47,663 - INFO - Processing document 4_2025-01-02


Converted 'data\edgar_documents\CAT\4_2024-12-27' --> 'data\processed_data\CAT\4_2024-12-27.md'


2025-11-14 15:53:48,972 - INFO - Finished converting document 4_2025-01-02 in 1.34 sec.
2025-11-14 15:53:49,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,059 - INFO - Going to convert document batch...
2025-11-14 15:53:49,059 - INFO - Processing document 4_2025-01-14
2025-11-14 15:53:49,121 - INFO - Finished converting document 4_2025-01-14 in 0.11 sec.
2025-11-14 15:53:49,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-01-02' --> 'data\processed_data\CAT\4_2025-01-02.md'
Converted 'data\edgar_documents\CAT\4_2025-01-14' --> 'data\processed_data\CAT\4_2025-01-14.md'


2025-11-14 15:53:49,228 - INFO - Going to convert document batch...
2025-11-14 15:53:49,229 - INFO - Processing document 4_2025-01-17
2025-11-14 15:53:49,275 - INFO - Finished converting document 4_2025-01-17 in 0.09 sec.
2025-11-14 15:53:49,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,367 - INFO - Going to convert document batch...
2025-11-14 15:53:49,368 - INFO - Processing document 4_2025-02-05
2025-11-14 15:53:49,424 - INFO - Finished converting document 4_2025-02-05 in 0.09 sec.
2025-11-14 15:53:49,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-01-17' --> 'data\processed_data\CAT\4_2025-01-17.md'
Converted 'data\edgar_documents\CAT\4_2025-02-05' --> 'data\processed_data\CAT\4_2025-02-05.md'


2025-11-14 15:53:49,541 - INFO - Going to convert document batch...
2025-11-14 15:53:49,543 - INFO - Processing document 4_2025-02-13
2025-11-14 15:53:49,606 - INFO - Finished converting document 4_2025-02-13 in 0.12 sec.
2025-11-14 15:53:49,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,706 - INFO - Going to convert document batch...
2025-11-14 15:53:49,707 - INFO - Processing document 4_2025-02-19
2025-11-14 15:53:49,771 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 15:53:49,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-02-13' --> 'data\processed_data\CAT\4_2025-02-13.md'
Converted 'data\edgar_documents\CAT\4_2025-02-19' --> 'data\processed_data\CAT\4_2025-02-19.md'


2025-11-14 15:53:49,882 - INFO - Going to convert document batch...
2025-11-14 15:53:49,884 - INFO - Processing document 4_2025-03-05
2025-11-14 15:53:49,948 - INFO - Finished converting document 4_2025-03-05 in 0.11 sec.
2025-11-14 15:53:50,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,050 - INFO - Going to convert document batch...
2025-11-14 15:53:50,051 - INFO - Processing document 4_2025-03-10
2025-11-14 15:53:50,105 - INFO - Finished converting document 4_2025-03-10 in 0.09 sec.
2025-11-14 15:53:50,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,211 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-03-05' --> 'data\processed_data\CAT\4_2025-03-05.md'
Converted 'data\edgar_documents\CAT\4_2025-03-10' --> 'data\processed_data\CAT\4_2025-03-10.md'


2025-11-14 15:53:50,213 - INFO - Processing document 4_2025-03-17
2025-11-14 15:53:50,286 - INFO - Finished converting document 4_2025-03-17 in 0.11 sec.
2025-11-14 15:53:50,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,495 - INFO - Going to convert document batch...
2025-11-14 15:53:50,497 - INFO - Processing document 4_2025-04-02
2025-11-14 15:53:50,558 - INFO - Finished converting document 4_2025-04-02 in 0.16 sec.


Converted 'data\edgar_documents\CAT\4_2025-03-17' --> 'data\processed_data\CAT\4_2025-03-17.md'


2025-11-14 15:53:50,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,666 - INFO - Going to convert document batch...
2025-11-14 15:53:50,667 - INFO - Processing document 4_2025-04-22
2025-11-14 15:53:50,728 - INFO - Finished converting document 4_2025-04-22 in 0.09 sec.
2025-11-14 15:53:50,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-04-02' --> 'data\processed_data\CAT\4_2025-04-02.md'
Converted 'data\edgar_documents\CAT\4_2025-04-22' --> 'data\processed_data\CAT\4_2025-04-22.md'


2025-11-14 15:53:50,834 - INFO - Going to convert document batch...
2025-11-14 15:53:50,837 - INFO - Processing document 4_2025-04-28
2025-11-14 15:53:50,913 - INFO - Finished converting document 4_2025-04-28 in 0.12 sec.
2025-11-14 15:53:51,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,040 - INFO - Going to convert document batch...
2025-11-14 15:53:51,041 - INFO - Processing document 4_2025-05-05
2025-11-14 15:53:51,102 - INFO - Finished converting document 4_2025-05-05 in 0.11 sec.
2025-11-14 15:53:51,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-04-28' --> 'data\processed_data\CAT\4_2025-04-28.md'
Converted 'data\edgar_documents\CAT\4_2025-05-05' --> 'data\processed_data\CAT\4_2025-05-05.md'


2025-11-14 15:53:51,203 - INFO - Going to convert document batch...
2025-11-14 15:53:51,205 - INFO - Processing document 4_2025-05-08
2025-11-14 15:53:51,267 - INFO - Finished converting document 4_2025-05-08 in 0.11 sec.
2025-11-14 15:53:51,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:53:51,355 - ERROR - Input document 4_2025-05-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:53:51,358 - INFO - Going to convert document batch...
2025-11-14 15:53:51,380 - IN

Converted 'data\edgar_documents\CAT\4_2025-05-08' --> 'data\processed_data\CAT\4_2025-05-08.md'
Error processing data\edgar_documents\CAT\4_2025-05-12: File format not allowed: data\edgar_documents\CAT\4_2025-05-12
Converted 'data\edgar_documents\CAT\4_2025-05-13' --> 'data\processed_data\CAT\4_2025-05-13.md'


2025-11-14 15:53:51,568 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:53:51,568 - ERROR - Input document 4_2025-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:53:51,570 - INFO - Going to convert document batch...
2025-11-14 15:53:51,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,608 - INFO - Going to convert document batch...
2025-11-14 15:53:51,609 - INFO - Processing document 4_2025-05-27
2025-11-14 15:53:51,657 - INFO - Fin

Error processing data\edgar_documents\CAT\4_2025-05-14: File format not allowed: data\edgar_documents\CAT\4_2025-05-14
Converted 'data\edgar_documents\CAT\4_2025-05-27' --> 'data\processed_data\CAT\4_2025-05-27.md'


2025-11-14 15:53:51,796 - INFO - Finished converting document 4_2025-06-13 in 0.09 sec.
2025-11-14 15:53:51,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,883 - INFO - Going to convert document batch...
2025-11-14 15:53:51,885 - INFO - Processing document 4_2025-06-27
2025-11-14 15:53:51,930 - INFO - Finished converting document 4_2025-06-27 in 0.08 sec.
2025-11-14 15:53:52,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,020 - INFO - Going to convert document batch...
2025-11-14 15:53:52,021 - INFO - Processing document 4_2025-07-02


Converted 'data\edgar_documents\CAT\4_2025-06-13' --> 'data\processed_data\CAT\4_2025-06-13.md'
Converted 'data\edgar_documents\CAT\4_2025-06-27' --> 'data\processed_data\CAT\4_2025-06-27.md'


2025-11-14 15:53:52,067 - INFO - Finished converting document 4_2025-07-02 in 0.09 sec.
2025-11-14 15:53:52,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,153 - INFO - Going to convert document batch...
2025-11-14 15:53:52,154 - INFO - Processing document 4_2025-07-21
2025-11-14 15:53:52,213 - INFO - Finished converting document 4_2025-07-21 in 0.11 sec.
2025-11-14 15:53:52,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-07-02' --> 'data\processed_data\CAT\4_2025-07-02.md'
Converted 'data\edgar_documents\CAT\4_2025-07-21' --> 'data\processed_data\CAT\4_2025-07-21.md'


2025-11-14 15:53:52,342 - INFO - Going to convert document batch...
2025-11-14 15:53:52,344 - INFO - Processing document 4_2025-07-28
2025-11-14 15:53:52,398 - INFO - Finished converting document 4_2025-07-28 in 0.11 sec.
2025-11-14 15:53:52,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,479 - INFO - Going to convert document batch...
2025-11-14 15:53:52,480 - INFO - Processing document 4_2025-08-08
2025-11-14 15:53:52,538 - INFO - Finished converting document 4_2025-08-08 in 0.09 sec.
2025-11-14 15:53:52,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,644 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-07-28' --> 'data\processed_data\CAT\4_2025-07-28.md'
Converted 'data\edgar_documents\CAT\4_2025-08-08' --> 'data\processed_data\CAT\4_2025-08-08.md'


2025-11-14 15:53:52,647 - INFO - Processing document 4_2025-08-13
2025-11-14 15:53:52,720 - INFO - Finished converting document 4_2025-08-13 in 0.14 sec.
2025-11-14 15:53:52,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,812 - INFO - Going to convert document batch...
2025-11-14 15:53:52,813 - INFO - Processing document 4_2025-08-19
2025-11-14 15:53:52,861 - INFO - Finished converting document 4_2025-08-19 in 0.08 sec.
2025-11-14 15:53:52,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,956 - INFO - Going to convert document batch...
2025-11-14 15:53:52,957 - INFO - Processing document 4_2025-08-27


Converted 'data\edgar_documents\CAT\4_2025-08-13' --> 'data\processed_data\CAT\4_2025-08-13.md'
Converted 'data\edgar_documents\CAT\4_2025-08-19' --> 'data\processed_data\CAT\4_2025-08-19.md'


2025-11-14 15:53:53,014 - INFO - Finished converting document 4_2025-08-27 in 0.11 sec.
2025-11-14 15:53:53,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,108 - INFO - Going to convert document batch...
2025-11-14 15:53:53,109 - INFO - Processing document 4_2025-09-03
2025-11-14 15:53:53,164 - INFO - Finished converting document 4_2025-09-03 in 0.09 sec.
2025-11-14 15:53:53,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-08-27' --> 'data\processed_data\CAT\4_2025-08-27.md'
Converted 'data\edgar_documents\CAT\4_2025-09-03' --> 'data\processed_data\CAT\4_2025-09-03.md'


2025-11-14 15:53:53,269 - INFO - Going to convert document batch...
2025-11-14 15:53:53,271 - INFO - Processing document 4_2025-09-23
2025-11-14 15:53:53,312 - INFO - Finished converting document 4_2025-09-23 in 0.09 sec.
2025-11-14 15:53:53,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,387 - INFO - Going to convert document batch...
2025-11-14 15:53:53,388 - INFO - Processing document 4_2025-09-29
2025-11-14 15:53:53,432 - INFO - Finished converting document 4_2025-09-29 in 0.06 sec.
2025-11-14 15:53:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,527 - INFO - Going to convert document batch...
2025-11-14 15:53:53,530 - INFO - Processing document 4_2025-10-01


Converted 'data\edgar_documents\CAT\4_2025-09-23' --> 'data\processed_data\CAT\4_2025-09-23.md'
Converted 'data\edgar_documents\CAT\4_2025-09-29' --> 'data\processed_data\CAT\4_2025-09-29.md'


2025-11-14 15:53:53,585 - INFO - Finished converting document 4_2025-10-01 in 0.11 sec.
2025-11-14 15:53:53,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,680 - INFO - Going to convert document batch...
2025-11-14 15:53:53,681 - INFO - Processing document 4_2025-10-14
2025-11-14 15:53:53,747 - INFO - Finished converting document 4_2025-10-14 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2025-10-01' --> 'data\processed_data\CAT\4_2025-10-01.md'
Converted 'data\edgar_documents\CAT\4_2025-10-14' --> 'data\processed_data\CAT\4_2025-10-14.md'


2025-11-14 15:53:53,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,874 - INFO - Going to convert document batch...
2025-11-14 15:53:53,876 - INFO - Processing document 4_2025-10-27
2025-11-14 15:53:53,929 - INFO - Finished converting document 4_2025-10-27 in 0.11 sec.
2025-11-14 15:53:53,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,004 - INFO - Going to convert document batch...
2025-11-14 15:53:54,005 - INFO - Processing document 4_2025-11-06
2025-11-14 15:53:54,060 - INFO - Finished converting document 4_2025-11-06 in 0.09 sec.
2025-11-14 15:53:54,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,152 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-10-27' --> 'data\processed_data\CAT\4_2025-10-27.md'
Converted 'data\edgar_documents\CAT\4_2025-11-06' --> 'data\processed_data\CAT\4_2025-11-06.md'


2025-11-14 15:53:54,153 - INFO - Processing document 4_2025-11-07
2025-11-14 15:53:54,206 - INFO - Finished converting document 4_2025-11-07 in 0.09 sec.
2025-11-14 15:53:54,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,354 - INFO - Going to convert document batch...
2025-11-14 15:53:54,355 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:53:54,422 - INFO - Finished converting document 8-K_2023-01-31 in 0.14 sec.


Converted 'data\edgar_documents\CAT\4_2025-11-07' --> 'data\processed_data\CAT\4_2025-11-07.md'


2025-11-14 15:53:54,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,628 - INFO - Going to convert document batch...
2025-11-14 15:53:54,629 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:53:54,689 - INFO - Finished converting document 8-K_2023-02-02 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-01-31' --> 'data\processed_data\CAT\8-K_2023-01-31.md'


2025-11-14 15:53:54,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,862 - INFO - Going to convert document batch...
2025-11-14 15:53:54,863 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:53:54,919 - INFO - Finished converting document 8-K_2023-04-27 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-02-02' --> 'data\processed_data\CAT\8-K_2023-02-02.md'


2025-11-14 15:53:55,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,127 - INFO - Going to convert document batch...
2025-11-14 15:53:55,129 - INFO - Processing document 8-K_2023-06-20
2025-11-14 15:53:55,239 - INFO - Finished converting document 8-K_2023-06-20 in 0.17 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-04-27' --> 'data\processed_data\CAT\8-K_2023-04-27.md'


2025-11-14 15:53:55,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,371 - INFO - Going to convert document batch...
2025-11-14 15:53:55,373 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:53:55,435 - INFO - Finished converting document 8-K_2023-08-01 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-06-20' --> 'data\processed_data\CAT\8-K_2023-06-20.md'


2025-11-14 15:53:55,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,643 - INFO - Going to convert document batch...
2025-11-14 15:53:55,645 - INFO - Processing document 8-K_2023-08-09
2025-11-14 15:53:55,707 - INFO - Finished converting document 8-K_2023-08-09 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-08-01' --> 'data\processed_data\CAT\8-K_2023-08-01.md'


2025-11-14 15:53:55,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,895 - INFO - Going to convert document batch...
2025-11-14 15:53:55,896 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:53:56,009 - INFO - Finished converting document 8-K_2023-09-01 in 0.16 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-08-09' --> 'data\processed_data\CAT\8-K_2023-08-09.md'


2025-11-14 15:53:56,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,134 - INFO - Going to convert document batch...
2025-11-14 15:53:56,136 - INFO - Processing document 8-K_2023-10-16
2025-11-14 15:53:56,191 - INFO - Finished converting document 8-K_2023-10-16 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-09-01' --> 'data\processed_data\CAT\8-K_2023-09-01.md'


2025-11-14 15:53:56,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,385 - INFO - Going to convert document batch...
2025-11-14 15:53:56,387 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:53:56,454 - INFO - Finished converting document 8-K_2023-10-31 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-10-16' --> 'data\processed_data\CAT\8-K_2023-10-16.md'


2025-11-14 15:53:56,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,663 - INFO - Going to convert document batch...
2025-11-14 15:53:56,665 - INFO - Processing document 8-K_2023-12-14
2025-11-14 15:53:56,725 - INFO - Finished converting document 8-K_2023-12-14 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-10-31' --> 'data\processed_data\CAT\8-K_2023-10-31.md'


2025-11-14 15:53:56,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,919 - INFO - Going to convert document batch...
2025-11-14 15:53:56,921 - INFO - Processing document 8-K_2024-02-05
2025-11-14 15:53:56,978 - INFO - Finished converting document 8-K_2024-02-05 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-12-14' --> 'data\processed_data\CAT\8-K_2023-12-14.md'


2025-11-14 15:53:57,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,155 - INFO - Going to convert document batch...
2025-11-14 15:53:57,156 - INFO - Processing document 8-K_2024-04-03
2025-11-14 15:53:57,211 - INFO - Finished converting document 8-K_2024-04-03 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-02-05' --> 'data\processed_data\CAT\8-K_2024-02-05.md'


2025-11-14 15:53:57,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,405 - INFO - Going to convert document batch...
2025-11-14 15:53:57,407 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:53:57,498 - INFO - Finished converting document 8-K_2024-04-25 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-04-03' --> 'data\processed_data\CAT\8-K_2024-04-03.md'


2025-11-14 15:53:57,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,705 - INFO - Going to convert document batch...
2025-11-14 15:53:57,706 - INFO - Processing document 8-K_2024-06-14
2025-11-14 15:53:57,785 - INFO - Finished converting document 8-K_2024-06-14 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-04-25' --> 'data\processed_data\CAT\8-K_2024-04-25.md'
Converted 'data\edgar_documents\CAT\8-K_2024-06-14' --> 'data\processed_data\CAT\8-K_2024-06-14.md'


2025-11-14 15:53:57,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,902 - INFO - Going to convert document batch...
2025-11-14 15:53:57,904 - INFO - Processing document 8-K_2024-08-06
2025-11-14 15:53:57,970 - INFO - Finished converting document 8-K_2024-08-06 in 0.12 sec.
2025-11-14 15:53:58,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:58,164 - INFO - Going to convert document batch...
2025-11-14 15:53:58,165 - INFO - Processing document 8-K_2024-09-04


Converted 'data\edgar_documents\CAT\8-K_2024-08-06' --> 'data\processed_data\CAT\8-K_2024-08-06.md'


2025-11-14 15:53:58,768 - INFO - Finished converting document 8-K_2024-09-04 in 0.66 sec.
2025-11-14 15:53:58,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:58,877 - INFO - Going to convert document batch...
2025-11-14 15:53:58,878 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:53:58,925 - INFO - Finished converting document 8-K_2024-10-11 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-09-04' --> 'data\processed_data\CAT\8-K_2024-09-04.md'


2025-11-14 15:53:59,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,148 - INFO - Going to convert document batch...
2025-11-14 15:53:59,150 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:53:59,230 - INFO - Finished converting document 8-K_2024-10-30 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-10-11' --> 'data\processed_data\CAT\8-K_2024-10-11.md'


2025-11-14 15:53:59,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,402 - INFO - Going to convert document batch...
2025-11-14 15:53:59,404 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:53:59,454 - INFO - Finished converting document 8-K_2025-01-30 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-10-30' --> 'data\processed_data\CAT\8-K_2024-10-30.md'


2025-11-14 15:53:59,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,609 - INFO - Going to convert document batch...
2025-11-14 15:53:59,610 - INFO - Processing document 8-K_2025-04-09
2025-11-14 15:53:59,683 - INFO - Finished converting document 8-K_2025-04-09 in 0.12 sec.
2025-11-14 15:53:59,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-01-30' --> 'data\processed_data\CAT\8-K_2025-01-30.md'
Converted 'data\edgar_documents\CAT\8-K_2025-04-09' --> 'data\processed_data\CAT\8-K_2025-04-09.md'


2025-11-14 15:53:59,786 - INFO - Going to convert document batch...
2025-11-14 15:53:59,787 - INFO - Processing document 8-K_2025-04-15
2025-11-14 15:53:59,845 - INFO - Finished converting document 8-K_2025-04-15 in 0.12 sec.
2025-11-14 15:53:59,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,971 - INFO - Going to convert document batch...
2025-11-14 15:53:59,973 - INFO - Processing document 8-K_2025-04-30
2025-11-14 15:54:00,046 - INFO - Finished converting document 8-K_2025-04-30 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-04-15' --> 'data\processed_data\CAT\8-K_2025-04-15.md'


2025-11-14 15:54:00,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,276 - INFO - Going to convert document batch...
2025-11-14 15:54:00,278 - INFO - Processing document 8-K_2025-05-15
2025-11-14 15:54:00,349 - INFO - Finished converting document 8-K_2025-05-15 in 0.12 sec.
2025-11-14 15:54:00,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-04-30' --> 'data\processed_data\CAT\8-K_2025-04-30.md'
Converted 'data\edgar_documents\CAT\8-K_2025-05-15' --> 'data\processed_data\CAT\8-K_2025-05-15.md'


2025-11-14 15:54:00,454 - INFO - Going to convert document batch...
2025-11-14 15:54:00,455 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:54:00,552 - INFO - Finished converting document 8-K_2025-06-12 in 0.16 sec.
2025-11-14 15:54:00,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,671 - INFO - Going to convert document batch...
2025-11-14 15:54:00,672 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:54:00,731 - INFO - Finished converting document 8-K_2025-08-05 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-06-12' --> 'data\processed_data\CAT\8-K_2025-06-12.md'


2025-11-14 15:54:00,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,908 - INFO - Going to convert document batch...
2025-11-14 15:54:00,909 - INFO - Processing document 8-K_2025-08-28
2025-11-14 15:54:00,966 - INFO - Finished converting document 8-K_2025-08-28 in 0.11 sec.
2025-11-14 15:54:01,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-08-05' --> 'data\processed_data\CAT\8-K_2025-08-05.md'
Converted 'data\edgar_documents\CAT\8-K_2025-08-28' --> 'data\processed_data\CAT\8-K_2025-08-28.md'


2025-11-14 15:54:01,073 - INFO - Going to convert document batch...
2025-11-14 15:54:01,075 - INFO - Processing document 8-K_2025-09-03
2025-11-14 15:54:01,178 - INFO - Finished converting document 8-K_2025-09-03 in 0.16 sec.
2025-11-14 15:54:01,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:01,286 - INFO - Going to convert document batch...
2025-11-14 15:54:01,287 - INFO - Processing document 8-K_2025-10-29
2025-11-14 15:54:01,341 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-09-03' --> 'data\processed_data\CAT\8-K_2025-09-03.md'


2025-11-14 15:54:01,573 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:54:01,574 - ERROR - Input document DEF-14A_2023-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:54:01,581 - INFO - Going to convert document batch...
2025-11-14 15:54:01,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-10-29' --> 'data\processed_data\CAT\8-K_2025-10-29.md'
Error processing data\edgar_documents\CAT\DEF-14A_2023-05-01: File format not allowed: data\edgar_documents\CAT\DEF-14A_2023-05-01


2025-11-14 15:54:02,571 - INFO - Going to convert document batch...
2025-11-14 15:54:02,572 - INFO - Processing document DEF-14A_2024-04-29
2025-11-14 15:54:05,655 - INFO - Finished converting document DEF-14A_2024-04-29 in 4.08 sec.
2025-11-14 15:54:07,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\DEF-14A_2024-04-29' --> 'data\processed_data\CAT\DEF-14A_2024-04-29.md'


2025-11-14 15:54:08,493 - INFO - Going to convert document batch...
2025-11-14 15:54:08,494 - INFO - Processing document DEF-14A_2025-04-30
2025-11-14 15:54:31,173 - INFO - Finished converting document DEF-14A_2025-04-30 in 23.72 sec.
2025-11-14 15:54:33,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\DEF-14A_2025-04-30' --> 'data\processed_data\CAT\DEF-14A_2025-04-30.md'
Processed 162 new files. Errors: 3
Found 168 files to process in data\edgar_documents\CHTR


2025-11-14 15:54:34,830 - INFO - Going to convert document batch...
2025-11-14 15:54:34,831 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:54:34,832 - INFO - Processing document 10-K_2023-01-27
2025-11-14 15:54:40,269 - INFO - Finished converting document 10-K_2023-01-27 in 6.77 sec.
2025-11-14 15:54:41,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2023-01-27' --> 'data\processed_data\CHTR\10-K_2023-01-27.md'


2025-11-14 15:54:43,158 - INFO - Going to convert document batch...
2025-11-14 15:54:43,159 - INFO - Processing document 10-K_2024-02-02
2025-11-14 15:54:48,257 - INFO - Finished converting document 10-K_2024-02-02 in 6.58 sec.
2025-11-14 15:54:49,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2024-02-02' --> 'data\processed_data\CHTR\10-K_2024-02-02.md'


2025-11-14 15:54:51,223 - INFO - Going to convert document batch...
2025-11-14 15:54:51,224 - INFO - Processing document 10-K_2025-01-31
2025-11-14 15:54:56,198 - INFO - Finished converting document 10-K_2025-01-31 in 6.52 sec.
2025-11-14 15:54:57,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2025-01-31' --> 'data\processed_data\CHTR\10-K_2025-01-31.md'


2025-11-14 15:54:59,035 - INFO - Going to convert document batch...
2025-11-14 15:54:59,036 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:55:00,171 - INFO - Finished converting document 10-Q_2023-04-28 in 2.56 sec.
2025-11-14 15:55:00,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-04-28' --> 'data\processed_data\CHTR\10-Q_2023-04-28.md'


2025-11-14 15:55:01,426 - INFO - Going to convert document batch...
2025-11-14 15:55:01,429 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 15:55:02,778 - INFO - Finished converting document 10-Q_2023-07-28 in 2.11 sec.
2025-11-14 15:55:03,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-07-28' --> 'data\processed_data\CHTR\10-Q_2023-07-28.md'


2025-11-14 15:55:04,228 - INFO - Going to convert document batch...
2025-11-14 15:55:04,229 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:55:05,843 - INFO - Finished converting document 10-Q_2023-10-27 in 2.36 sec.
2025-11-14 15:55:06,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-10-27' --> 'data\processed_data\CHTR\10-Q_2023-10-27.md'


2025-11-14 15:55:07,667 - INFO - Going to convert document batch...
2025-11-14 15:55:07,668 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 15:55:08,654 - INFO - Finished converting document 10-Q_2024-04-26 in 2.30 sec.
2025-11-14 15:55:09,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-04-26' --> 'data\processed_data\CHTR\10-Q_2024-04-26.md'


2025-11-14 15:55:09,945 - INFO - Going to convert document batch...
2025-11-14 15:55:09,946 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:55:11,068 - INFO - Finished converting document 10-Q_2024-07-26 in 1.84 sec.
2025-11-14 15:55:11,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-07-26' --> 'data\processed_data\CHTR\10-Q_2024-07-26.md'


2025-11-14 15:55:12,738 - INFO - Going to convert document batch...
2025-11-14 15:55:12,739 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:55:13,827 - INFO - Finished converting document 10-Q_2024-11-01 in 2.25 sec.
2025-11-14 15:55:14,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-11-01' --> 'data\processed_data\CHTR\10-Q_2024-11-01.md'


2025-11-14 15:55:14,969 - INFO - Going to convert document batch...
2025-11-14 15:55:14,971 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 15:55:16,202 - INFO - Finished converting document 10-Q_2025-04-25 in 1.75 sec.
2025-11-14 15:55:16,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2025-04-25' --> 'data\processed_data\CHTR\10-Q_2025-04-25.md'


2025-11-14 15:55:17,510 - INFO - Going to convert document batch...
2025-11-14 15:55:17,511 - INFO - Processing document 10-Q_2025-07-25
2025-11-14 15:55:18,916 - INFO - Finished converting document 10-Q_2025-07-25 in 2.19 sec.
2025-11-14 15:55:19,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2025-07-25' --> 'data\processed_data\CHTR\10-Q_2025-07-25.md'


2025-11-14 15:55:20,750 - INFO - Going to convert document batch...
2025-11-14 15:55:20,751 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:55:22,011 - INFO - Finished converting document 10-Q_2025-10-31 in 2.58 sec.
2025-11-14 15:55:22,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,555 - INFO - Going to convert document batch...
2025-11-14 15:55:22,558 - INFO - Processing document 4_2023-01-06
2025-11-14 15:55:22,597 - INFO - Finished converting document 4_2023-01-06 in 0.08 sec.
2025-11-14 15:55:22,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,673 - INFO - Going to convert document batch...
2025-11-14 15:55:22,674 - INFO - Processing document 4_2023-01-18
2025-11-14 15:55:22,706 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\10-Q_2025-10-31' --> 'data\processed_data\CHTR\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\CHTR\4_2023-01-06' --> 'data\processed_data\CHTR\4_2023-01-06.md'


2025-11-14 15:55:22,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,787 - INFO - Going to convert document batch...
2025-11-14 15:55:22,788 - INFO - Processing document 4_2023-01-19
2025-11-14 15:55:22,862 - INFO - Finished converting document 4_2023-01-19 in 0.12 sec.
2025-11-14 15:55:22,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-01-18' --> 'data\processed_data\CHTR\4_2023-01-18.md'
Converted 'data\edgar_documents\CHTR\4_2023-01-19' --> 'data\processed_data\CHTR\4_2023-01-19.md'


2025-11-14 15:55:22,958 - INFO - Going to convert document batch...
2025-11-14 15:55:22,959 - INFO - Processing document 4_2023-02-01
2025-11-14 15:55:22,992 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 15:55:23,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,053 - INFO - Going to convert document batch...
2025-11-14 15:55:23,054 - INFO - Processing document 4_2023-02-03
2025-11-14 15:55:23,088 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.
2025-11-14 15:55:23,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,155 - INFO - Going to convert document batch...
2025-11-14 15:55:23,156 - INFO - Processing document 4_2023-02-24
2025-11-14 15:55:23,197 - INFO - Finished converting document 4_2023-02-24 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2023-02-01' --> 'data\processed_data\CHTR\4_2023-02-01.md'
Converted 'data\edgar_documents\CHTR\4_2023-02-03' --> 'data\processed_data\CHTR\4_2023-02-03.md'


2025-11-14 15:55:23,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,272 - INFO - Going to convert document batch...
2025-11-14 15:55:23,273 - INFO - Processing document 4_2023-03-01
2025-11-14 15:55:23,327 - INFO - Finished converting document 4_2023-03-01 in 0.09 sec.
2025-11-14 15:55:23,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,426 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-02-24' --> 'data\processed_data\CHTR\4_2023-02-24.md'
Converted 'data\edgar_documents\CHTR\4_2023-03-01' --> 'data\processed_data\CHTR\4_2023-03-01.md'


2025-11-14 15:55:23,428 - INFO - Processing document 4_2023-03-06
2025-11-14 15:55:23,464 - INFO - Finished converting document 4_2023-03-06 in 0.08 sec.
2025-11-14 15:55:23,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,533 - INFO - Going to convert document batch...
2025-11-14 15:55:23,534 - INFO - Processing document 4_2023-03-21
2025-11-14 15:55:23,575 - INFO - Finished converting document 4_2023-03-21 in 0.08 sec.
2025-11-14 15:55:23,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,659 - INFO - Going to convert document batch...
2025-11-14 15:55:23,659 - INFO - Processing document 4_2023-04-07
2025-11-14 15:55:23,698 - INFO - Finished converting document 4_2023-04-07 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2023-03-06' --> 'data\processed_data\CHTR\4_2023-03-06.md'
Converted 'data\edgar_documents\CHTR\4_2023-03-21' --> 'data\processed_data\CHTR\4_2023-03-21.md'


2025-11-14 15:55:23,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,788 - INFO - Going to convert document batch...
2025-11-14 15:55:23,789 - INFO - Processing document 4_2023-04-26
2025-11-14 15:55:23,831 - INFO - Finished converting document 4_2023-04-26 in 0.08 sec.
2025-11-14 15:55:23,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,920 - INFO - Going to convert document batch...
2025-11-14 15:55:23,923 - INFO - Processing document 4_2023-05-08


Converted 'data\edgar_documents\CHTR\4_2023-04-07' --> 'data\processed_data\CHTR\4_2023-04-07.md'
Converted 'data\edgar_documents\CHTR\4_2023-04-26' --> 'data\processed_data\CHTR\4_2023-04-26.md'


2025-11-14 15:55:23,961 - INFO - Finished converting document 4_2023-05-08 in 0.08 sec.
2025-11-14 15:55:24,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,045 - INFO - Going to convert document batch...
2025-11-14 15:55:24,051 - INFO - Processing document 4_2023-05-16
2025-11-14 15:55:24,104 - INFO - Finished converting document 4_2023-05-16 in 0.09 sec.
2025-11-14 15:55:24,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,184 - INFO - Going to convert document batch...
2025-11-14 15:55:24,186 - INFO - Processing document 4_2023-06-07


Converted 'data\edgar_documents\CHTR\4_2023-05-08' --> 'data\processed_data\CHTR\4_2023-05-08.md'
Converted 'data\edgar_documents\CHTR\4_2023-05-16' --> 'data\processed_data\CHTR\4_2023-05-16.md'


2025-11-14 15:55:24,228 - INFO - Finished converting document 4_2023-06-07 in 0.06 sec.
2025-11-14 15:55:24,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,330 - INFO - Going to convert document batch...
2025-11-14 15:55:24,330 - INFO - Processing document 4_2023-06-16
2025-11-14 15:55:24,431 - INFO - Finished converting document 4_2023-06-16 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-06-07' --> 'data\processed_data\CHTR\4_2023-06-07.md'


2025-11-14 15:55:24,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,554 - INFO - Going to convert document batch...
2025-11-14 15:55:24,556 - INFO - Processing document 4_2023-07-05
2025-11-14 15:55:24,604 - INFO - Finished converting document 4_2023-07-05 in 0.09 sec.
2025-11-14 15:55:24,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,697 - INFO - Going to convert document batch...
2025-11-14 15:55:24,698 - INFO - Processing document 4_2023-07-06


Converted 'data\edgar_documents\CHTR\4_2023-06-16' --> 'data\processed_data\CHTR\4_2023-06-16.md'
Converted 'data\edgar_documents\CHTR\4_2023-07-05' --> 'data\processed_data\CHTR\4_2023-07-05.md'


2025-11-14 15:55:24,744 - INFO - Finished converting document 4_2023-07-06 in 0.08 sec.
2025-11-14 15:55:24,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,844 - INFO - Going to convert document batch...
2025-11-14 15:55:24,845 - INFO - Processing document 4_2023-07-07
2025-11-14 15:55:24,925 - INFO - Finished converting document 4_2023-07-07 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2023-07-06' --> 'data\processed_data\CHTR\4_2023-07-06.md'


2025-11-14 15:55:25,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,053 - INFO - Going to convert document batch...
2025-11-14 15:55:25,054 - INFO - Processing document 4_2023-07-25
2025-11-14 15:55:25,148 - INFO - Finished converting document 4_2023-07-25 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-07-07' --> 'data\processed_data\CHTR\4_2023-07-07.md'


2025-11-14 15:55:25,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,244 - INFO - Going to convert document batch...
2025-11-14 15:55:25,245 - INFO - Processing document 4_2023-08-04
2025-11-14 15:55:25,279 - INFO - Finished converting document 4_2023-08-04 in 0.06 sec.
2025-11-14 15:55:25,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,378 - INFO - Going to convert document batch...
2025-11-14 15:55:25,379 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\CHTR\4_2023-07-25' --> 'data\processed_data\CHTR\4_2023-07-25.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-04' --> 'data\processed_data\CHTR\4_2023-08-04.md'


2025-11-14 15:55:25,463 - INFO - Finished converting document 4_2023-08-07 in 0.14 sec.
2025-11-14 15:55:25,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,645 - INFO - Going to convert document batch...
2025-11-14 15:55:25,646 - INFO - Processing document 4_2023-08-17


Converted 'data\edgar_documents\CHTR\4_2023-08-07' --> 'data\processed_data\CHTR\4_2023-08-07.md'


2025-11-14 15:55:25,861 - INFO - Finished converting document 4_2023-08-17 in 0.31 sec.
2025-11-14 15:55:25,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:26,006 - INFO - Going to convert document batch...
2025-11-14 15:55:26,007 - INFO - Processing document 4_2023-08-18
2025-11-14 15:55:26,045 - INFO - Finished converting document 4_2023-08-18 in 0.08 sec.
2025-11-14 15:55:26,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-08-17' --> 'data\processed_data\CHTR\4_2023-08-17.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-18' --> 'data\processed_data\CHTR\4_2023-08-18.md'


2025-11-14 15:55:26,173 - INFO - Going to convert document batch...
2025-11-14 15:55:26,174 - INFO - Processing document 4_2023-08-22
2025-11-14 15:55:26,964 - INFO - Finished converting document 4_2023-08-22 in 0.89 sec.
2025-11-14 15:55:27,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:27,212 - INFO - Going to convert document batch...
2025-11-14 15:55:27,214 - INFO - Processing document 4_2023-08-25


Converted 'data\edgar_documents\CHTR\4_2023-08-22' --> 'data\processed_data\CHTR\4_2023-08-22.md'


2025-11-14 15:55:27,399 - INFO - Finished converting document 4_2023-08-25 in 0.27 sec.
2025-11-14 15:55:27,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:27,563 - INFO - Going to convert document batch...
2025-11-14 15:55:27,563 - INFO - Processing document 4_2023-08-29
2025-11-14 15:55:27,623 - INFO - Finished converting document 4_2023-08-29 in 0.11 sec.
2025-11-14 15:55:27,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-08-25' --> 'data\processed_data\CHTR\4_2023-08-25.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-29' --> 'data\processed_data\CHTR\4_2023-08-29.md'


2025-11-14 15:55:27,798 - INFO - Going to convert document batch...
2025-11-14 15:55:27,799 - INFO - Processing document 4_2023-08-30
2025-11-14 15:55:28,010 - INFO - Finished converting document 4_2023-08-30 in 0.34 sec.
2025-11-14 15:55:28,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,184 - INFO - Going to convert document batch...
2025-11-14 15:55:28,186 - INFO - Processing document 4_2023-09-08
2025-11-14 15:55:28,248 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:55:28,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,323 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-08-30' --> 'data\processed_data\CHTR\4_2023-08-30.md'
Converted 'data\edgar_documents\CHTR\4_2023-09-08' --> 'data\processed_data\CHTR\4_2023-09-08.md'


2025-11-14 15:55:28,325 - INFO - Processing document 4_2023-10-05
2025-11-14 15:55:28,366 - INFO - Finished converting document 4_2023-10-05 in 0.08 sec.
2025-11-14 15:55:28,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,441 - INFO - Going to convert document batch...
2025-11-14 15:55:28,442 - INFO - Processing document 4_2023-10-10
2025-11-14 15:55:28,478 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.
2025-11-14 15:55:28,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,565 - INFO - Going to convert document batch...
2025-11-14 15:55:28,566 - INFO - Processing document 4_2023-10-17
2025-11-14 15:55:28,597 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2023-10-05' --> 'data\processed_data\CHTR\4_2023-10-05.md'
Converted 'data\edgar_documents\CHTR\4_2023-10-10' --> 'data\processed_data\CHTR\4_2023-10-10.md'


2025-11-14 15:55:28,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,729 - INFO - Going to convert document batch...
2025-11-14 15:55:28,732 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\CHTR\4_2023-10-17' --> 'data\processed_data\CHTR\4_2023-10-17.md'


2025-11-14 15:55:28,887 - INFO - Finished converting document 4_2023-11-02 in 0.27 sec.
2025-11-14 15:55:28,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,016 - INFO - Going to convert document batch...
2025-11-14 15:55:29,018 - INFO - Processing document 4_2023-11-06
2025-11-14 15:55:29,060 - INFO - Finished converting document 4_2023-11-06 in 0.08 sec.
2025-11-14 15:55:29,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,147 - INFO - Going to convert document batch...
2025-11-14 15:55:29,148 - INFO - Processing document 4_2023-11-08
2025-11-14 15:55:29,181 - INFO - Finished converting document 4_2023-11-08 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-02' --> 'data\processed_data\CHTR\4_2023-11-02.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-06' --> 'data\processed_data\CHTR\4_2023-11-06.md'


2025-11-14 15:55:29,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,245 - INFO - Going to convert document batch...
2025-11-14 15:55:29,246 - INFO - Processing document 4_2023-11-15
2025-11-14 15:55:29,277 - INFO - Finished converting document 4_2023-11-15 in 0.06 sec.
2025-11-14 15:55:29,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,354 - INFO - Going to convert document batch...
2025-11-14 15:55:29,355 - INFO - Processing document 4_2023-11-16


Converted 'data\edgar_documents\CHTR\4_2023-11-08' --> 'data\processed_data\CHTR\4_2023-11-08.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-15' --> 'data\processed_data\CHTR\4_2023-11-15.md'


2025-11-14 15:55:29,448 - INFO - Finished converting document 4_2023-11-16 in 0.14 sec.
2025-11-14 15:55:29,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,573 - INFO - Going to convert document batch...
2025-11-14 15:55:29,574 - INFO - Processing document 4_2023-11-20
2025-11-14 15:55:29,668 - INFO - Finished converting document 4_2023-11-20 in 0.16 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-16' --> 'data\processed_data\CHTR\4_2023-11-16.md'


2025-11-14 15:55:29,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,823 - INFO - Going to convert document batch...
2025-11-14 15:55:29,824 - INFO - Processing document 4_2023-11-21
2025-11-14 15:55:29,892 - INFO - Finished converting document 4_2023-11-21 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-20' --> 'data\processed_data\CHTR\4_2023-11-20.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-21' --> 'data\processed_data\CHTR\4_2023-11-21.md'


2025-11-14 15:55:29,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,010 - INFO - Going to convert document batch...
2025-11-14 15:55:30,011 - INFO - Processing document 4_2023-12-04
2025-11-14 15:55:30,078 - INFO - Finished converting document 4_2023-12-04 in 0.12 sec.
2025-11-14 15:55:30,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,182 - INFO - Going to convert document batch...
2025-11-14 15:55:30,183 - INFO - Processing document 4_2023-12-07
2025-11-14 15:55:30,219 - INFO - Finished converting document 4_2023-12-07 in 0.08 sec.
2025-11-14 15:55:30,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,302 - INFO - Going to convert document batch...
2025-11-14 15:55:30,303 - INFO - Processing document 4_2023-12-15
2025-11-14 15:55:30,340 - INFO - Finished converting document 4_2023-12-15 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2023-12-04' --> 'data\processed_data\CHTR\4_2023-12-04.md'
Converted 'data\edgar_documents\CHTR\4_2023-12-07' --> 'data\processed_data\CHTR\4_2023-12-07.md'


2025-11-14 15:55:30,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,416 - INFO - Going to convert document batch...
2025-11-14 15:55:30,417 - INFO - Processing document 4_2024-01-05
2025-11-14 15:55:30,464 - INFO - Finished converting document 4_2024-01-05 in 0.09 sec.
2025-11-14 15:55:30,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,589 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-12-15' --> 'data\processed_data\CHTR\4_2023-12-15.md'
Converted 'data\edgar_documents\CHTR\4_2024-01-05' --> 'data\processed_data\CHTR\4_2024-01-05.md'


2025-11-14 15:55:30,590 - INFO - Processing document 4_2024-01-17
2025-11-14 15:55:30,655 - INFO - Finished converting document 4_2024-01-17 in 0.16 sec.
2025-11-14 15:55:30,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,774 - INFO - Going to convert document batch...
2025-11-14 15:55:30,775 - INFO - Processing document 4_2024-01-23
2025-11-14 15:55:30,812 - INFO - Finished converting document 4_2024-01-23 in 0.06 sec.
2025-11-14 15:55:30,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,875 - INFO - Going to convert document batch...
2025-11-14 15:55:30,876 - INFO - Processing document 4_2024-02-06
2025-11-14 15:55:30,911 - INFO - Finished converting document 4_2024-02-06 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-01-17' --> 'data\processed_data\CHTR\4_2024-01-17.md'
Converted 'data\edgar_documents\CHTR\4_2024-01-23' --> 'data\processed_data\CHTR\4_2024-01-23.md'
Converted 'data\edgar_documents\CHTR\4_2024-02-06' --> 'data\processed_data\CHTR\4_2024-02-06.md'


2025-11-14 15:55:30,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,015 - INFO - Going to convert document batch...
2025-11-14 15:55:31,016 - INFO - Processing document 4_2024-02-07
2025-11-14 15:55:31,058 - INFO - Finished converting document 4_2024-02-07 in 0.11 sec.
2025-11-14 15:55:31,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,129 - INFO - Going to convert document batch...
2025-11-14 15:55:31,131 - INFO - Processing document 4_2024-03-01
2025-11-14 15:55:31,164 - INFO - Finished converting document 4_2024-03-01 in 0.06 sec.
2025-11-14 15:55:31,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,224 - INFO - Going to convert document batch...
2025-11-14 15:55:31,225 - INFO - Processing document 4_2024-03-06
2025-11-14 15:55:31,259 - INFO - Finished converting document 4_2024-03-06 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-02-07' --> 'data\processed_data\CHTR\4_2024-02-07.md'
Converted 'data\edgar_documents\CHTR\4_2024-03-01' --> 'data\processed_data\CHTR\4_2024-03-01.md'
Converted 'data\edgar_documents\CHTR\4_2024-03-06' --> 'data\processed_data\CHTR\4_2024-03-06.md'


2025-11-14 15:55:31,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,362 - INFO - Going to convert document batch...
2025-11-14 15:55:31,363 - INFO - Processing document 4_2024-04-05
2025-11-14 15:55:31,461 - INFO - Finished converting document 4_2024-04-05 in 0.16 sec.
2025-11-14 15:55:31,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,554 - INFO - Going to convert document batch...
2025-11-14 15:55:31,555 - INFO - Processing document 4_2024-04-25
2025-11-14 15:55:31,590 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 15:55:31,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,668 - INFO - Going to convert document batch...
2025-11-14 15:55:31,669 - INFO - Processing document 4_2024-05-06
2025-11-14 15:55:31,705 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2024-04-05' --> 'data\processed_data\CHTR\4_2024-04-05.md'
Converted 'data\edgar_documents\CHTR\4_2024-04-25' --> 'data\processed_data\CHTR\4_2024-04-25.md'


2025-11-14 15:55:31,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,777 - INFO - Going to convert document batch...
2025-11-14 15:55:31,778 - INFO - Processing document 4_2024-06-10
2025-11-14 15:55:31,818 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.
2025-11-14 15:55:31,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,903 - INFO - Going to convert document batch...
2025-11-14 15:55:31,904 - INFO - Processing document 4_2024-06-14


Converted 'data\edgar_documents\CHTR\4_2024-05-06' --> 'data\processed_data\CHTR\4_2024-05-06.md'
Converted 'data\edgar_documents\CHTR\4_2024-06-10' --> 'data\processed_data\CHTR\4_2024-06-10.md'


2025-11-14 15:55:31,947 - INFO - Finished converting document 4_2024-06-14 in 0.08 sec.
2025-11-14 15:55:32,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,024 - INFO - Going to convert document batch...
2025-11-14 15:55:32,025 - INFO - Processing document 4_2024-06-17
2025-11-14 15:55:32,058 - INFO - Finished converting document 4_2024-06-17 in 0.08 sec.
2025-11-14 15:55:32,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,121 - INFO - Going to convert document batch...
2025-11-14 15:55:32,122 - INFO - Processing document 4_2024-06-25
2025-11-14 15:55:32,161 - INFO - Finished converting document 4_2024-06-25 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-06-14' --> 'data\processed_data\CHTR\4_2024-06-14.md'
Converted 'data\edgar_documents\CHTR\4_2024-06-17' --> 'data\processed_data\CHTR\4_2024-06-17.md'


2025-11-14 15:55:32,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,246 - INFO - Going to convert document batch...
2025-11-14 15:55:32,247 - INFO - Processing document 4_2024-07-02
2025-11-14 15:55:32,295 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2024-06-25' --> 'data\processed_data\CHTR\4_2024-06-25.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-02' --> 'data\processed_data\CHTR\4_2024-07-02.md'


2025-11-14 15:55:32,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,431 - INFO - Going to convert document batch...
2025-11-14 15:55:32,433 - INFO - Processing document 4_2024-07-08
2025-11-14 15:55:32,465 - INFO - Finished converting document 4_2024-07-08 in 0.08 sec.
2025-11-14 15:55:32,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,540 - INFO - Going to convert document batch...
2025-11-14 15:55:32,541 - INFO - Processing document 4_2024-07-16
2025-11-14 15:55:33,147 - INFO - Finished converting document 4_2024-07-16 in 0.64 sec.


Converted 'data\edgar_documents\CHTR\4_2024-07-08' --> 'data\processed_data\CHTR\4_2024-07-08.md'


2025-11-14 15:55:33,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,222 - INFO - Going to convert document batch...
2025-11-14 15:55:33,223 - INFO - Processing document 4_2024-07-17
2025-11-14 15:55:33,268 - INFO - Finished converting document 4_2024-07-17 in 0.08 sec.
2025-11-14 15:55:33,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,358 - INFO - Going to convert document batch...
2025-11-14 15:55:33,359 - INFO - Processing document 4_2024-07-26


Converted 'data\edgar_documents\CHTR\4_2024-07-16' --> 'data\processed_data\CHTR\4_2024-07-16.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-17' --> 'data\processed_data\CHTR\4_2024-07-17.md'


2025-11-14 15:55:33,438 - INFO - Finished converting document 4_2024-07-26 in 0.12 sec.
2025-11-14 15:55:33,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,559 - INFO - Going to convert document batch...
2025-11-14 15:55:33,561 - INFO - Processing document 4_2024-07-30
2025-11-14 15:55:33,635 - INFO - Finished converting document 4_2024-07-30 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2024-07-26' --> 'data\processed_data\CHTR\4_2024-07-26.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-30' --> 'data\processed_data\CHTR\4_2024-07-30.md'


2025-11-14 15:55:33,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,733 - INFO - Going to convert document batch...
2025-11-14 15:55:33,734 - INFO - Processing document 4_2024-08-07
2025-11-14 15:55:33,773 - INFO - Finished converting document 4_2024-08-07 in 0.08 sec.
2025-11-14 15:55:33,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,838 - INFO - Going to convert document batch...
2025-11-14 15:55:33,840 - INFO - Processing document 4_2024-08-15
2025-11-14 15:55:33,880 - INFO - Finished converting document 4_2024-08-15 in 0.06 sec.
2025-11-14 15:55:33,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,959 - INFO - Going to convert document batch...
2025-11-14 15:55:33,961 - INFO - Processing document 4_2024-09-13
2025-11-14 15:55:33,999 - INFO - Finished converting document 4_2024-09-13 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2024-08-07' --> 'data\processed_data\CHTR\4_2024-08-07.md'
Converted 'data\edgar_documents\CHTR\4_2024-08-15' --> 'data\processed_data\CHTR\4_2024-08-15.md'


2025-11-14 15:55:34,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,064 - INFO - Going to convert document batch...
2025-11-14 15:55:34,065 - INFO - Processing document 4_2024-09-17
2025-11-14 15:55:34,098 - INFO - Finished converting document 4_2024-09-17 in 0.06 sec.
2025-11-14 15:55:34,145 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,146 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55

Converted 'data\edgar_documents\CHTR\4_2024-09-13' --> 'data\processed_data\CHTR\4_2024-09-13.md'
Converted 'data\edgar_documents\CHTR\4_2024-09-17' --> 'data\processed_data\CHTR\4_2024-09-17.md'
Error processing data\edgar_documents\CHTR\4_2024-09-23: File format not allowed: data\edgar_documents\CHTR\4_2024-09-23


2025-11-14 15:55:34,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,294 - INFO - Going to convert document batch...
2025-11-14 15:55:34,295 - INFO - Processing document 4_2024-10-15
2025-11-14 15:55:34,333 - INFO - Finished converting document 4_2024-10-15 in 0.08 sec.
2025-11-14 15:55:34,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,394 - INFO - Going to convert document batch...
2025-11-14 15:55:34,396 - INFO - Processing document 4_2024-10-22


Converted 'data\edgar_documents\CHTR\4_2024-10-09' --> 'data\processed_data\CHTR\4_2024-10-09.md'
Converted 'data\edgar_documents\CHTR\4_2024-10-15' --> 'data\processed_data\CHTR\4_2024-10-15.md'


2025-11-14 15:55:34,476 - INFO - Finished converting document 4_2024-10-22 in 0.11 sec.
2025-11-14 15:55:34,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,589 - INFO - Going to convert document batch...
2025-11-14 15:55:34,590 - INFO - Processing document 4_2024-11-07
2025-11-14 15:55:34,657 - INFO - Finished converting document 4_2024-11-07 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2024-10-22' --> 'data\processed_data\CHTR\4_2024-10-22.md'
Converted 'data\edgar_documents\CHTR\4_2024-11-07' --> 'data\processed_data\CHTR\4_2024-11-07.md'


2025-11-14 15:55:34,754 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,755 - ERROR - Input document 4_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:34,757 - INFO - Going to convert document batch...
2025-11-14 15:55:34,774 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,775 - ERROR - Input document 4_2024-11-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CHTR\4_2024-11-13: File format not allowed: data\edgar_documents\CHTR\4_2024-11-13
Error processing data\edgar_documents\CHTR\4_2024-11-14: File format not allowed: data\edgar_documents\CHTR\4_2024-11-14
Converted 'data\edgar_documents\CHTR\4_2024-11-18' --> 'data\processed_data\CHTR\4_2024-11-18.md'
Error processing data\edgar_documents\CHTR\4_2024-11-20: File format not allowed: data\edgar_documents\CHTR\4_2024-11-20


2025-11-14 15:55:34,963 - INFO - Going to convert document batch...
2025-11-14 15:55:34,964 - INFO - Processing document 4_2024-12-05
2025-11-14 15:55:35,003 - INFO - Finished converting document 4_2024-12-05 in 0.08 sec.
2025-11-14 15:55:35,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,069 - INFO - Going to convert document batch...
2025-11-14 15:55:35,070 - INFO - Processing document 4_2024-12-13
2025-11-14 15:55:35,116 - INFO - Finished converting document 4_2024-12-13 in 0.08 sec.
2025-11-14 15:55:35,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,206 - INFO - Going to convert document batch...
2025-11-14 15:55:35,210 - INFO - Processing document 4_2025-01-08


Converted 'data\edgar_documents\CHTR\4_2024-12-05' --> 'data\processed_data\CHTR\4_2024-12-05.md'
Converted 'data\edgar_documents\CHTR\4_2024-12-13' --> 'data\processed_data\CHTR\4_2024-12-13.md'


2025-11-14 15:55:35,253 - INFO - Finished converting document 4_2025-01-08 in 0.09 sec.
2025-11-14 15:55:35,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,328 - INFO - Going to convert document batch...
2025-11-14 15:55:35,329 - INFO - Processing document 4_2025-01-14
2025-11-14 15:55:35,371 - INFO - Finished converting document 4_2025-01-14 in 0.08 sec.
2025-11-14 15:55:35,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,479 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-01-08' --> 'data\processed_data\CHTR\4_2025-01-08.md'
Converted 'data\edgar_documents\CHTR\4_2025-01-14' --> 'data\processed_data\CHTR\4_2025-01-14.md'


2025-11-14 15:55:35,481 - INFO - Processing document 4_2025-01-17
2025-11-14 15:55:35,542 - INFO - Finished converting document 4_2025-01-17 in 0.12 sec.
2025-11-14 15:55:35,595 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:35,596 - ERROR - Input document 4_2025-01-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:35,598 - INFO - Going to convert document batch...
2025-11-14 15:55:35,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55

Converted 'data\edgar_documents\CHTR\4_2025-01-17' --> 'data\processed_data\CHTR\4_2025-01-17.md'
Error processing data\edgar_documents\CHTR\4_2025-01-22: File format not allowed: data\edgar_documents\CHTR\4_2025-01-22
Converted 'data\edgar_documents\CHTR\4_2025-02-07' --> 'data\processed_data\CHTR\4_2025-02-07.md'


2025-11-14 15:55:35,779 - ERROR - Input document 4_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:35,782 - INFO - Going to convert document batch...
2025-11-14 15:55:35,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,828 - INFO - Going to convert document batch...
2025-11-14 15:55:35,830 - INFO - Processing document 4_2025-03-10
2025-11-14 15:55:35,895 - INFO - Finished converting document 4_2025-03-10 in 0.11 sec.
2025-11-14 15:55:35,971 - INFO - detec

Error processing data\edgar_documents\CHTR\4_2025-02-19: File format not allowed: data\edgar_documents\CHTR\4_2025-02-19
Converted 'data\edgar_documents\CHTR\4_2025-03-10' --> 'data\processed_data\CHTR\4_2025-03-10.md'


2025-11-14 15:55:36,001 - INFO - Going to convert document batch...
2025-11-14 15:55:36,004 - INFO - Processing document 4_2025-03-13
2025-11-14 15:55:36,051 - INFO - Finished converting document 4_2025-03-13 in 0.09 sec.
2025-11-14 15:55:36,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,127 - INFO - Going to convert document batch...
2025-11-14 15:55:36,128 - INFO - Processing document 4_2025-03-20
2025-11-14 15:55:36,170 - INFO - Finished converting document 4_2025-03-20 in 0.08 sec.
2025-11-14 15:55:36,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,238 - INFO - Going to convert document batch...
2025-11-14 15:55:36,239 - INFO - Processing document 4_2025-03-26
2025-11-14 15:55:36,274 - INFO - Finished converting document 4_2025-03-26 in 0.05 sec.


Converted 'data\edgar_documents\CHTR\4_2025-03-13' --> 'data\processed_data\CHTR\4_2025-03-13.md'
Converted 'data\edgar_documents\CHTR\4_2025-03-20' --> 'data\processed_data\CHTR\4_2025-03-20.md'


2025-11-14 15:55:36,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,368 - INFO - Going to convert document batch...
2025-11-14 15:55:36,369 - INFO - Processing document 4_2025-04-01
2025-11-14 15:55:36,437 - INFO - Finished converting document 4_2025-04-01 in 0.11 sec.
2025-11-14 15:55:36,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-03-26' --> 'data\processed_data\CHTR\4_2025-03-26.md'
Converted 'data\edgar_documents\CHTR\4_2025-04-01' --> 'data\processed_data\CHTR\4_2025-04-01.md'


2025-11-14 15:55:36,541 - INFO - Going to convert document batch...
2025-11-14 15:55:36,543 - INFO - Processing document 4_2025-04-04
2025-11-14 15:55:36,588 - INFO - Finished converting document 4_2025-04-04 in 0.09 sec.
2025-11-14 15:55:36,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,652 - INFO - Going to convert document batch...
2025-11-14 15:55:36,653 - INFO - Processing document 4_2025-04-11
2025-11-14 15:55:36,691 - INFO - Finished converting document 4_2025-04-11 in 0.06 sec.
2025-11-14 15:55:36,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,794 - INFO - Going to convert document batch...
2025-11-14 15:55:36,796 - INFO - Processing document 4_2025-04-24


Converted 'data\edgar_documents\CHTR\4_2025-04-04' --> 'data\processed_data\CHTR\4_2025-04-04.md'
Converted 'data\edgar_documents\CHTR\4_2025-04-11' --> 'data\processed_data\CHTR\4_2025-04-11.md'


2025-11-14 15:55:36,848 - INFO - Finished converting document 4_2025-04-24 in 0.11 sec.
2025-11-14 15:55:36,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,950 - INFO - Going to convert document batch...
2025-11-14 15:55:36,951 - INFO - Processing document 4_2025-05-07
2025-11-14 15:55:37,002 - INFO - Finished converting document 4_2025-05-07 in 0.09 sec.
2025-11-14 15:55:37,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,080 - INFO - Going to convert document batch...
2025-11-14 15:55:37,082 - INFO - Processing document 4_2025-05-13


Converted 'data\edgar_documents\CHTR\4_2025-04-24' --> 'data\processed_data\CHTR\4_2025-04-24.md'
Converted 'data\edgar_documents\CHTR\4_2025-05-07' --> 'data\processed_data\CHTR\4_2025-05-07.md'


2025-11-14 15:55:37,144 - INFO - Finished converting document 4_2025-05-13 in 0.09 sec.
2025-11-14 15:55:37,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,222 - INFO - Going to convert document batch...
2025-11-14 15:55:37,223 - INFO - Processing document 4_2025-05-20
2025-11-14 15:55:37,285 - INFO - Finished converting document 4_2025-05-20 in 0.09 sec.
2025-11-14 15:55:37,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,373 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-05-13' --> 'data\processed_data\CHTR\4_2025-05-13.md'
Converted 'data\edgar_documents\CHTR\4_2025-05-20' --> 'data\processed_data\CHTR\4_2025-05-20.md'


2025-11-14 15:55:37,375 - INFO - Processing document 4_2025-06-10
2025-11-14 15:55:37,434 - INFO - Finished converting document 4_2025-06-10 in 0.09 sec.
2025-11-14 15:55:37,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,531 - INFO - Going to convert document batch...
2025-11-14 15:55:37,532 - INFO - Processing document 4_2025-06-12
2025-11-14 15:55:37,574 - INFO - Finished converting document 4_2025-06-12 in 0.08 sec.
2025-11-14 15:55:37,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,716 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-06-10' --> 'data\processed_data\CHTR\4_2025-06-10.md'
Converted 'data\edgar_documents\CHTR\4_2025-06-12' --> 'data\processed_data\CHTR\4_2025-06-12.md'


2025-11-14 15:55:37,718 - INFO - Processing document 4_2025-06-20
2025-11-14 15:55:37,853 - INFO - Finished converting document 4_2025-06-20 in 0.22 sec.
2025-11-14 15:55:37,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,003 - INFO - Going to convert document batch...
2025-11-14 15:55:38,006 - INFO - Processing document 4_2025-07-03


Converted 'data\edgar_documents\CHTR\4_2025-06-20' --> 'data\processed_data\CHTR\4_2025-06-20.md'


2025-11-14 15:55:38,119 - INFO - Finished converting document 4_2025-07-03 in 0.19 sec.
2025-11-14 15:55:38,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,221 - INFO - Going to convert document batch...
2025-11-14 15:55:38,222 - INFO - Processing document 4_2025-07-08
2025-11-14 15:55:38,267 - INFO - Finished converting document 4_2025-07-08 in 0.08 sec.
2025-11-14 15:55:38,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-07-03' --> 'data\processed_data\CHTR\4_2025-07-03.md'
Converted 'data\edgar_documents\CHTR\4_2025-07-08' --> 'data\processed_data\CHTR\4_2025-07-08.md'


2025-11-14 15:55:38,382 - INFO - Going to convert document batch...
2025-11-14 15:55:38,385 - INFO - Processing document 4_2025-07-15
2025-11-14 15:55:38,465 - INFO - Finished converting document 4_2025-07-15 in 0.14 sec.
2025-11-14 15:55:38,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,570 - INFO - Going to convert document batch...
2025-11-14 15:55:38,572 - INFO - Processing document 4_2025-07-29
2025-11-14 15:55:38,639 - INFO - Finished converting document 4_2025-07-29 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2025-07-15' --> 'data\processed_data\CHTR\4_2025-07-15.md'


2025-11-14 15:55:38,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,742 - INFO - Going to convert document batch...
2025-11-14 15:55:38,744 - INFO - Processing document 4_2025-07-31
2025-11-14 15:55:38,803 - INFO - Finished converting document 4_2025-07-31 in 0.09 sec.
2025-11-14 15:55:38,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,888 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-07-29' --> 'data\processed_data\CHTR\4_2025-07-29.md'
Converted 'data\edgar_documents\CHTR\4_2025-07-31' --> 'data\processed_data\CHTR\4_2025-07-31.md'


2025-11-14 15:55:38,890 - INFO - Processing document 4_2025-08-04
2025-11-14 15:55:38,950 - INFO - Finished converting document 4_2025-08-04 in 0.11 sec.
2025-11-14 15:55:39,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,065 - INFO - Going to convert document batch...
2025-11-14 15:55:39,067 - INFO - Processing document 4_2025-08-05
2025-11-14 15:55:39,130 - INFO - Finished converting document 4_2025-08-05 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2025-08-04' --> 'data\processed_data\CHTR\4_2025-08-04.md'
Converted 'data\edgar_documents\CHTR\4_2025-08-05' --> 'data\processed_data\CHTR\4_2025-08-05.md'


2025-11-14 15:55:39,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,230 - INFO - Going to convert document batch...
2025-11-14 15:55:39,231 - INFO - Processing document 4_2025-08-07
2025-11-14 15:55:39,307 - INFO - Finished converting document 4_2025-08-07 in 0.12 sec.
2025-11-14 15:55:39,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,407 - INFO - Going to convert document batch...
2025-11-14 15:55:39,409 - INFO - Processing document 4_2025-08-13
2025-11-14 15:55:39,461 - INFO - Finished converting document 4_2025-08-13 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2025-08-07' --> 'data\processed_data\CHTR\4_2025-08-07.md'
Converted 'data\edgar_documents\CHTR\4_2025-08-13' --> 'data\processed_data\CHTR\4_2025-08-13.md'


2025-11-14 15:55:39,557 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:39,560 - ERROR - Input document 4_2025-08-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:39,562 - INFO - Going to convert document batch...
2025-11-14 15:55:39,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,619 - INFO - Going to convert document batch...
2025-11-14 15:55:39,621 - INFO - Processing document 4_2025-09-12
2025-11-14 15:55:39,682 - INFO - Fin

Error processing data\edgar_documents\CHTR\4_2025-08-18: File format not allowed: data\edgar_documents\CHTR\4_2025-08-18
Converted 'data\edgar_documents\CHTR\4_2025-09-12' --> 'data\processed_data\CHTR\4_2025-09-12.md'


2025-11-14 15:55:39,808 - INFO - Going to convert document batch...
2025-11-14 15:55:39,811 - INFO - Processing document 4_2025-09-23
2025-11-14 15:55:39,887 - INFO - Finished converting document 4_2025-09-23 in 0.16 sec.
2025-11-14 15:55:39,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,983 - INFO - Going to convert document batch...
2025-11-14 15:55:39,985 - INFO - Processing document 4_2025-10-14
2025-11-14 15:55:40,027 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\4_2025-09-23' --> 'data\processed_data\CHTR\4_2025-09-23.md'
Converted 'data\edgar_documents\CHTR\4_2025-10-14' --> 'data\processed_data\CHTR\4_2025-10-14.md'


2025-11-14 15:55:40,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,130 - INFO - Going to convert document batch...
2025-11-14 15:55:40,132 - INFO - Processing document 4_2025-11-07
2025-11-14 15:55:40,188 - INFO - Finished converting document 4_2025-11-07 in 0.12 sec.
2025-11-14 15:55:40,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,333 - INFO - Going to convert document batch...
2025-11-14 15:55:40,335 - INFO - Processing document 8-K_2023-01-27
2025-11-14 15:55:40,374 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 15:55:40,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-11-07' --> 'data\processed_data\CHTR\4_2025-11-07.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-01-27' --> 'data\processed_data\CHTR\8-K_2023-01-27.md'


2025-11-14 15:55:40,521 - INFO - Going to convert document batch...
2025-11-14 15:55:40,522 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:55:40,636 - INFO - Finished converting document 8-K_2023-02-16 in 0.23 sec.
2025-11-14 15:55:40,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,848 - INFO - Going to convert document batch...
2025-11-14 15:55:40,850 - INFO - Processing document 8-K_2023-02-24


Converted 'data\edgar_documents\CHTR\8-K_2023-02-16' --> 'data\processed_data\CHTR\8-K_2023-02-16.md'


2025-11-14 15:55:40,945 - INFO - Finished converting document 8-K_2023-02-24 in 0.22 sec.
2025-11-14 15:55:41,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:41,086 - INFO - Going to convert document batch...
2025-11-14 15:55:41,088 - INFO - Processing document 8-K_2023-03-29


Converted 'data\edgar_documents\CHTR\8-K_2023-02-24' --> 'data\processed_data\CHTR\8-K_2023-02-24.md'


2025-11-14 15:55:41,636 - INFO - Finished converting document 8-K_2023-03-29 in 0.64 sec.
2025-11-14 15:55:41,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:41,767 - INFO - Going to convert document batch...
2025-11-14 15:55:41,768 - INFO - Processing document 8-K_2023-04-06
2025-11-14 15:55:41,830 - INFO - Finished converting document 8-K_2023-04-06 in 0.14 sec.
2025-11-14 15:55:41,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-03-29' --> 'data\processed_data\CHTR\8-K_2023-03-29.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-04-06' --> 'data\processed_data\CHTR\8-K_2023-04-06.md'


2025-11-14 15:55:41,933 - INFO - Going to convert document batch...
2025-11-14 15:55:41,935 - INFO - Processing document 8-K_2023-04-21
2025-11-14 15:55:41,991 - INFO - Finished converting document 8-K_2023-04-21 in 0.14 sec.
2025-11-14 15:55:42,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,116 - INFO - Going to convert document batch...
2025-11-14 15:55:42,118 - INFO - Processing document 8-K_2023-04-28
2025-11-14 15:55:42,161 - INFO - Finished converting document 8-K_2023-04-28 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\8-K_2023-04-21' --> 'data\processed_data\CHTR\8-K_2023-04-21.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-04-28' --> 'data\processed_data\CHTR\8-K_2023-04-28.md'


2025-11-14 15:55:42,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,273 - INFO - Going to convert document batch...
2025-11-14 15:55:42,274 - INFO - Processing document 8-K_2023-05-01
2025-11-14 15:55:42,343 - INFO - Finished converting document 8-K_2023-05-01 in 0.16 sec.
2025-11-14 15:55:42,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,444 - INFO - Going to convert document batch...
2025-11-14 15:55:42,445 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:55:42,480 - INFO - Finished converting document 8-K_2023-06-29 in 0.11 sec.
2025-11-14 15:55:42,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-05-01' --> 'data\processed_data\CHTR\8-K_2023-05-01.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-06-29' --> 'data\processed_data\CHTR\8-K_2023-06-29.md'


2025-11-14 15:55:42,580 - INFO - Going to convert document batch...
2025-11-14 15:55:42,582 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:55:42,619 - INFO - Finished converting document 8-K_2023-07-28 in 0.11 sec.
2025-11-14 15:55:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,695 - INFO - Going to convert document batch...
2025-11-14 15:55:42,696 - INFO - Processing document 8-K_2023-08-21
2025-11-14 15:55:42,729 - INFO - Finished converting document 8-K_2023-08-21 in 0.06 sec.
2025-11-14 15:55:42,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-07-28' --> 'data\processed_data\CHTR\8-K_2023-07-28.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-08-21' --> 'data\processed_data\CHTR\8-K_2023-08-21.md'


2025-11-14 15:55:42,847 - INFO - Going to convert document batch...
2025-11-14 15:55:42,850 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:55:42,920 - INFO - Finished converting document 8-K_2023-09-01 in 0.17 sec.
2025-11-14 15:55:42,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,027 - INFO - Going to convert document batch...
2025-11-14 15:55:43,028 - INFO - Processing document 8-K_2023-09-11
2025-11-14 15:55:43,067 - INFO - Finished converting document 8-K_2023-09-11 in 0.11 sec.
2025-11-14 15:55:43,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-09-01' --> 'data\processed_data\CHTR\8-K_2023-09-01.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-09-11' --> 'data\processed_data\CHTR\8-K_2023-09-11.md'


2025-11-14 15:55:43,181 - INFO - Going to convert document batch...
2025-11-14 15:55:43,182 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:55:43,226 - INFO - Finished converting document 8-K_2023-10-25 in 0.12 sec.
2025-11-14 15:55:43,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,322 - INFO - Going to convert document batch...
2025-11-14 15:55:43,323 - INFO - Processing document 8-K_2023-10-27
2025-11-14 15:55:43,360 - INFO - Finished converting document 8-K_2023-10-27 in 0.11 sec.
2025-11-14 15:55:43,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-10-25' --> 'data\processed_data\CHTR\8-K_2023-10-25.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-10-27' --> 'data\processed_data\CHTR\8-K_2023-10-27.md'


2025-11-14 15:55:43,471 - INFO - Going to convert document batch...
2025-11-14 15:55:43,472 - INFO - Processing document 8-K_2023-11-13
2025-11-14 15:55:43,574 - INFO - Finished converting document 8-K_2023-11-13 in 0.19 sec.
2025-11-14 15:55:43,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,720 - INFO - Going to convert document batch...
2025-11-14 15:55:43,721 - INFO - Processing document 8-K_2023-12-13


Converted 'data\edgar_documents\CHTR\8-K_2023-11-13' --> 'data\processed_data\CHTR\8-K_2023-11-13.md'


2025-11-14 15:55:43,822 - INFO - Finished converting document 8-K_2023-12-13 in 0.17 sec.
2025-11-14 15:55:43,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,963 - INFO - Going to convert document batch...
2025-11-14 15:55:43,966 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:55:44,025 - INFO - Finished converting document 8-K_2024-02-02 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\8-K_2023-12-13' --> 'data\processed_data\CHTR\8-K_2023-12-13.md'


2025-11-14 15:55:44,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,165 - INFO - Going to convert document batch...
2025-11-14 15:55:44,166 - INFO - Processing document 8-K_2024-02-05
2025-11-14 15:55:44,208 - INFO - Finished converting document 8-K_2024-02-05 in 0.12 sec.
2025-11-14 15:55:44,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2024-02-02' --> 'data\processed_data\CHTR\8-K_2024-02-02.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-02-05' --> 'data\processed_data\CHTR\8-K_2024-02-05.md'


2025-11-14 15:55:44,361 - INFO - Going to convert document batch...
2025-11-14 15:55:44,364 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:55:44,482 - INFO - Finished converting document 8-K_2024-04-26 in 0.25 sec.
2025-11-14 15:55:44,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,576 - INFO - Going to convert document batch...
2025-11-14 15:55:44,577 - INFO - Processing document 8-K_2024-05-09
2025-11-14 15:55:44,643 - INFO - Finished converting document 8-K_2024-05-09 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\8-K_2024-04-26' --> 'data\processed_data\CHTR\8-K_2024-04-26.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-05-09' --> 'data\processed_data\CHTR\8-K_2024-05-09.md'


2025-11-14 15:55:44,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,807 - INFO - Going to convert document batch...
2025-11-14 15:55:44,809 - INFO - Processing document 8-K_2024-05-10
2025-11-14 15:55:44,871 - INFO - Finished converting document 8-K_2024-05-10 in 0.17 sec.
2025-11-14 15:55:44,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,959 - INFO - Going to convert document batch...
2025-11-14 15:55:44,960 - INFO - Processing document 8-K_2024-05-14
2025-11-14 15:55:45,076 - INFO - Finished converting document 8-K_2024-05-14 in 0.17 sec.


Converted 'data\edgar_documents\CHTR\8-K_2024-05-10' --> 'data\processed_data\CHTR\8-K_2024-05-10.md'


2025-11-14 15:55:45,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,222 - INFO - Going to convert document batch...
2025-11-14 15:55:45,223 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:55:45,282 - INFO - Finished converting document 8-K_2024-07-26 in 0.11 sec.
2025-11-14 15:55:45,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2024-05-14' --> 'data\processed_data\CHTR\8-K_2024-05-14.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-07-26' --> 'data\processed_data\CHTR\8-K_2024-07-26.md'


2025-11-14 15:55:45,399 - INFO - Going to convert document batch...
2025-11-14 15:55:45,400 - INFO - Processing document 8-K_2024-11-01
2025-11-14 15:55:45,440 - INFO - Finished converting document 8-K_2024-11-01 in 0.12 sec.
2025-11-14 15:55:45,499 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:45,500 - ERROR - Input document 8-K_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,501 - INFO - Going to convert docu

Converted 'data\edgar_documents\CHTR\8-K_2024-11-01' --> 'data\processed_data\CHTR\8-K_2024-11-01.md'
Error processing data\edgar_documents\CHTR\8-K_2024-11-13: File format not allowed: data\edgar_documents\CHTR\8-K_2024-11-13


2025-11-14 15:55:45,667 - INFO - Finished converting document 8-K_2024-12-09 in 0.17 sec.
2025-11-14 15:55:45,774 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:45,775 - ERROR - Input document 8-K_2024-12-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,776 - INFO - Going to convert document batch...
2025-11-14 15:55:45,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,829 - INFO - Going to 

Converted 'data\edgar_documents\CHTR\8-K_2024-12-09' --> 'data\processed_data\CHTR\8-K_2024-12-09.md'
Error processing data\edgar_documents\CHTR\8-K_2024-12-13: File format not allowed: data\edgar_documents\CHTR\8-K_2024-12-13
Converted 'data\edgar_documents\CHTR\8-K_2025-01-31' --> 'data\processed_data\CHTR\8-K_2025-01-31.md'


2025-11-14 15:55:45,932 - ERROR - Input document 8-K_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,934 - INFO - Going to convert document batch...
2025-11-14 15:55:45,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,984 - INFO - Going to convert document batch...
2025-11-14 15:55:45,985 - INFO - Processing document 8-K_2025-02-27
2025-11-14 15:55:46,041 - INFO - Finished converting document 8-K_2025-02-27 in 0.11 sec.
2025-11-14 15:55:46,114 - INFO -

Error processing data\edgar_documents\CHTR\8-K_2025-02-19: File format not allowed: data\edgar_documents\CHTR\8-K_2025-02-19
Converted 'data\edgar_documents\CHTR\8-K_2025-02-27' --> 'data\processed_data\CHTR\8-K_2025-02-27.md'


2025-11-14 15:55:46,158 - INFO - Going to convert document batch...
2025-11-14 15:55:46,159 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:55:46,238 - INFO - Finished converting document 8-K_2025-04-25 in 0.17 sec.
2025-11-14 15:55:46,333 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:46,335 - ERROR - Input document 8-K_2025-05-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:46,336 - INFO - Going to convert docu

Converted 'data\edgar_documents\CHTR\8-K_2025-04-25' --> 'data\processed_data\CHTR\8-K_2025-04-25.md'
Error processing data\edgar_documents\CHTR\8-K_2025-05-16: File format not allowed: data\edgar_documents\CHTR\8-K_2025-05-16
Error processing data\edgar_documents\CHTR\8-K_2025-05-19: File format not allowed: data\edgar_documents\CHTR\8-K_2025-05-19
Error processing data\edgar_documents\CHTR\8-K_2025-07-21: File format not allowed: data\edgar_documents\CHTR\8-K_2025-07-21


2025-11-14 15:55:46,449 - INFO - Processing document 8-K_2025-07-25
2025-11-14 15:55:46,487 - INFO - Finished converting document 8-K_2025-07-25 in 0.08 sec.
2025-11-14 15:55:46,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,570 - INFO - Going to convert document batch...
2025-11-14 15:55:46,571 - INFO - Processing document 8-K_2025-08-01
2025-11-14 15:55:46,642 - INFO - Finished converting document 8-K_2025-08-01 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\8-K_2025-07-25' --> 'data\processed_data\CHTR\8-K_2025-07-25.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-08-01' --> 'data\processed_data\CHTR\8-K_2025-08-01.md'


2025-11-14 15:55:46,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,743 - INFO - Going to convert document batch...
2025-11-14 15:55:46,745 - INFO - Processing document 8-K_2025-08-04
2025-11-14 15:55:46,799 - INFO - Finished converting document 8-K_2025-08-04 in 0.11 sec.
2025-11-14 15:55:46,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,877 - INFO - Going to convert document batch...
2025-11-14 15:55:46,878 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:55:46,912 - INFO - Finished converting document 8-K_2025-08-05 in 0.08 sec.
2025-11-14 15:55:46,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2025-08-04' --> 'data\processed_data\CHTR\8-K_2025-08-04.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-08-05' --> 'data\processed_data\CHTR\8-K_2025-08-05.md'


2025-11-14 15:55:47,026 - INFO - Going to convert document batch...
2025-11-14 15:55:47,027 - INFO - Processing document 8-K_2025-08-18
2025-11-14 15:55:47,136 - INFO - Finished converting document 8-K_2025-08-18 in 0.22 sec.
2025-11-14 15:55:47,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,313 - INFO - Going to convert document batch...
2025-11-14 15:55:47,315 - INFO - Processing document 8-K_2025-08-20


Converted 'data\edgar_documents\CHTR\8-K_2025-08-18' --> 'data\processed_data\CHTR\8-K_2025-08-18.md'


2025-11-14 15:55:47,437 - INFO - Finished converting document 8-K_2025-08-20 in 0.23 sec.
2025-11-14 15:55:47,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,609 - INFO - Going to convert document batch...
2025-11-14 15:55:47,611 - INFO - Processing document 8-K_2025-09-02


Converted 'data\edgar_documents\CHTR\8-K_2025-08-20' --> 'data\processed_data\CHTR\8-K_2025-08-20.md'


2025-11-14 15:55:47,757 - INFO - Finished converting document 8-K_2025-09-02 in 0.25 sec.
2025-11-14 15:55:47,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,912 - INFO - Going to convert document batch...
2025-11-14 15:55:47,913 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:55:47,951 - INFO - Finished converting document 8-K_2025-10-31 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\8-K_2025-09-02' --> 'data\processed_data\CHTR\8-K_2025-09-02.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-10-31' --> 'data\processed_data\CHTR\8-K_2025-10-31.md'


2025-11-14 15:55:48,064 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:48,065 - ERROR - Input document DEF-14A_2023-03-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:48,069 - INFO - Going to convert document batch...
2025-11-14 15:55:48,150 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:48,151 - ERROR - Input document DEF-14A_2024-03-14 with format No

Error processing data\edgar_documents\CHTR\DEF-14A_2023-03-16: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2023-03-16
Error processing data\edgar_documents\CHTR\DEF-14A_2024-03-14: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2024-03-14


2025-11-14 15:55:48,252 - ERROR - Input document DEF-14A_2025-03-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:48,254 - INFO - Going to convert document batch...
2025-11-14 15:55:48,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\CHTR\DEF-14A_2025-03-13: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2025-03-13
Processed 152 new files. Errors: 16
Found 111 files to process in data\edgar_documents\CL


2025-11-14 15:55:50,782 - INFO - Going to convert document batch...
2025-11-14 15:55:50,785 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:55:50,785 - INFO - Processing document 10-K_2023-02-16
2025-11-14 15:55:56,952 - INFO - Finished converting document 10-K_2023-02-16 in 8.69 sec.
2025-11-14 15:55:58,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2023-02-16' --> 'data\processed_data\CL\10-K_2023-02-16.md'


2025-11-14 15:56:00,210 - INFO - Going to convert document batch...
2025-11-14 15:56:00,212 - INFO - Processing document 10-K_2024-02-15
2025-11-14 15:56:06,165 - INFO - Finished converting document 10-K_2024-02-15 in 7.75 sec.
2025-11-14 15:56:07,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2024-02-15' --> 'data\processed_data\CL\10-K_2024-02-15.md'


2025-11-14 15:56:08,975 - INFO - Going to convert document batch...
2025-11-14 15:56:08,977 - INFO - Processing document 10-K_2025-02-13
2025-11-14 15:56:14,230 - INFO - Finished converting document 10-K_2025-02-13 in 6.86 sec.
2025-11-14 15:56:15,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2025-02-13' --> 'data\processed_data\CL\10-K_2025-02-13.md'


2025-11-14 15:56:15,802 - INFO - Going to convert document batch...
2025-11-14 15:56:15,803 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:56:16,346 - INFO - Finished converting document 10-Q_2023-04-28 in 1.31 sec.
2025-11-14 15:56:16,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-04-28' --> 'data\processed_data\CL\10-Q_2023-04-28.md'


2025-11-14 15:56:17,094 - INFO - Going to convert document batch...
2025-11-14 15:56:17,095 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 15:56:18,234 - INFO - Finished converting document 10-Q_2023-07-28 in 1.61 sec.
2025-11-14 15:56:18,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-07-28' --> 'data\processed_data\CL\10-Q_2023-07-28.md'


2025-11-14 15:56:19,140 - INFO - Going to convert document batch...
2025-11-14 15:56:19,140 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:56:20,007 - INFO - Finished converting document 10-Q_2023-10-27 in 1.34 sec.
2025-11-14 15:56:20,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-10-27' --> 'data\processed_data\CL\10-Q_2023-10-27.md'


2025-11-14 15:56:21,275 - INFO - Going to convert document batch...
2025-11-14 15:56:21,276 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 15:56:22,648 - INFO - Finished converting document 10-Q_2024-04-26 in 2.22 sec.
2025-11-14 15:56:23,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-04-26' --> 'data\processed_data\CL\10-Q_2024-04-26.md'


2025-11-14 15:56:24,399 - INFO - Going to convert document batch...
2025-11-14 15:56:24,401 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:56:26,449 - INFO - Finished converting document 10-Q_2024-07-26 in 3.14 sec.
2025-11-14 15:56:27,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-07-26' --> 'data\processed_data\CL\10-Q_2024-07-26.md'


2025-11-14 15:56:28,862 - INFO - Going to convert document batch...
2025-11-14 15:56:28,864 - INFO - Processing document 10-Q_2024-10-25
2025-11-14 15:56:30,715 - INFO - Finished converting document 10-Q_2024-10-25 in 3.58 sec.
2025-11-14 15:56:31,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-10-25' --> 'data\processed_data\CL\10-Q_2024-10-25.md'


2025-11-14 15:56:32,394 - INFO - Going to convert document batch...
2025-11-14 15:56:32,396 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 15:56:33,645 - INFO - Finished converting document 10-Q_2025-04-25 in 2.02 sec.
2025-11-14 15:56:34,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2025-04-25' --> 'data\processed_data\CL\10-Q_2025-04-25.md'


2025-11-14 15:56:35,850 - INFO - Going to convert document batch...
2025-11-14 15:56:35,851 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:56:37,428 - INFO - Finished converting document 10-Q_2025-08-01 in 3.23 sec.
2025-11-14 15:56:38,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2025-08-01' --> 'data\processed_data\CL\10-Q_2025-08-01.md'


2025-11-14 15:56:39,328 - INFO - Going to convert document batch...
2025-11-14 15:56:39,330 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:56:42,062 - INFO - Finished converting document 10-Q_2025-10-31 in 3.92 sec.
2025-11-14 15:56:43,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,057 - INFO - Going to convert document batch...
2025-11-14 15:56:43,058 - INFO - Processing document 4_2023-01-05
2025-11-14 15:56:43,118 - INFO - Finished converting document 4_2023-01-05 in 0.09 sec.


Converted 'data\edgar_documents\CL\10-Q_2025-10-31' --> 'data\processed_data\CL\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\CL\4_2023-01-05' --> 'data\processed_data\CL\4_2023-01-05.md'


2025-11-14 15:56:43,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,250 - INFO - Going to convert document batch...
2025-11-14 15:56:43,252 - INFO - Processing document 4_2023-02-03
2025-11-14 15:56:43,326 - INFO - Finished converting document 4_2023-02-03 in 0.14 sec.
2025-11-14 15:56:43,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,445 - INFO - Going to convert document batch...
2025-11-14 15:56:43,446 - INFO - Processing document 4_2023-02-17
2025-11-14 15:56:43,489 - INFO - Finished converting document 4_2023-02-17 in 0.09 sec.
2025-11-14 15:56:43,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,572 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2023-02-03' --> 'data\processed_data\CL\4_2023-02-03.md'
Converted 'data\edgar_documents\CL\4_2023-02-17' --> 'data\processed_data\CL\4_2023-02-17.md'


2025-11-14 15:56:43,575 - INFO - Processing document 4_2023-02-21
2025-11-14 15:56:43,646 - INFO - Finished converting document 4_2023-02-21 in 0.12 sec.
2025-11-14 15:56:43,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,734 - INFO - Going to convert document batch...
2025-11-14 15:56:43,735 - INFO - Processing document 4_2023-02-23
2025-11-14 15:56:43,793 - INFO - Finished converting document 4_2023-02-23 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-02-21' --> 'data\processed_data\CL\4_2023-02-21.md'
Converted 'data\edgar_documents\CL\4_2023-02-23' --> 'data\processed_data\CL\4_2023-02-23.md'


2025-11-14 15:56:43,897 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:43,899 - ERROR - Input document 4_2023-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:43,902 - INFO - Going to convert document batch...
2025-11-14 15:56:43,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,952 - INFO - Going to convert document batch...
2025-11-14 15:56:43,953 - INFO - Processing document 4_2023-03-01


Error processing data\edgar_documents\CL\4_2023-02-27: File format not allowed: data\edgar_documents\CL\4_2023-02-27
Converted 'data\edgar_documents\CL\4_2023-03-01' --> 'data\processed_data\CL\4_2023-03-01.md'


2025-11-14 15:56:44,098 - INFO - Going to convert document batch...
2025-11-14 15:56:44,100 - INFO - Processing document 4_2023-03-15
2025-11-14 15:56:44,132 - INFO - Finished converting document 4_2023-03-15 in 0.08 sec.
2025-11-14 15:56:44,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,220 - INFO - Going to convert document batch...
2025-11-14 15:56:44,222 - INFO - Processing document 4_2023-04-05
2025-11-14 15:56:44,276 - INFO - Finished converting document 4_2023-04-05 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-03-15' --> 'data\processed_data\CL\4_2023-03-15.md'


2025-11-14 15:56:44,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,421 - INFO - Going to convert document batch...
2025-11-14 15:56:44,422 - INFO - Processing document 4_2023-05-05
2025-11-14 15:56:44,486 - INFO - Finished converting document 4_2023-05-05 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-04-05' --> 'data\processed_data\CL\4_2023-04-05.md'
Converted 'data\edgar_documents\CL\4_2023-05-05' --> 'data\processed_data\CL\4_2023-05-05.md'


2025-11-14 15:56:44,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,616 - INFO - Going to convert document batch...
2025-11-14 15:56:44,617 - INFO - Processing document 4_2023-05-10
2025-11-14 15:56:44,661 - INFO - Finished converting document 4_2023-05-10 in 0.09 sec.
2025-11-14 15:56:44,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,793 - INFO - Going to convert document batch...
2025-11-14 15:56:44,794 - INFO - Processing document 4_2023-05-12
2025-11-14 15:56:44,868 - INFO - Finished converting document 4_2023-05-12 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-05-10' --> 'data\processed_data\CL\4_2023-05-10.md'


2025-11-14 15:56:44,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,029 - INFO - Going to convert document batch...
2025-11-14 15:56:45,031 - INFO - Processing document 4_2023-05-17
2025-11-14 15:56:45,088 - INFO - Finished converting document 4_2023-05-17 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-05-12' --> 'data\processed_data\CL\4_2023-05-12.md'


2025-11-14 15:56:45,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,209 - INFO - Going to convert document batch...
2025-11-14 15:56:45,212 - INFO - Processing document 4_2023-05-23
2025-11-14 15:56:45,262 - INFO - Finished converting document 4_2023-05-23 in 0.11 sec.


Converted 'data\edgar_documents\CL\4_2023-05-17' --> 'data\processed_data\CL\4_2023-05-17.md'
Converted 'data\edgar_documents\CL\4_2023-05-23' --> 'data\processed_data\CL\4_2023-05-23.md'


2025-11-14 15:56:45,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,379 - INFO - Going to convert document batch...
2025-11-14 15:56:45,380 - INFO - Processing document 4_2023-07-06
2025-11-14 15:56:45,420 - INFO - Finished converting document 4_2023-07-06 in 0.09 sec.
2025-11-14 15:56:45,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,539 - INFO - Going to convert document batch...
2025-11-14 15:56:45,540 - INFO - Processing document 4_2023-08-04
2025-11-14 15:56:45,581 - INFO - Finished converting document 4_2023-08-04 in 0.09 sec.
2025-11-14 15:56:45,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,655 - INFO - Going to convert document batch...
2025-11-14 15:56:45,656 - INFO - Processing document 4_2023-09-01


Converted 'data\edgar_documents\CL\4_2023-07-06' --> 'data\processed_data\CL\4_2023-07-06.md'
Converted 'data\edgar_documents\CL\4_2023-08-04' --> 'data\processed_data\CL\4_2023-08-04.md'


2025-11-14 15:56:45,696 - INFO - Finished converting document 4_2023-09-01 in 0.06 sec.
2025-11-14 15:56:45,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,779 - INFO - Going to convert document batch...
2025-11-14 15:56:45,780 - INFO - Processing document 4_2023-09-12
2025-11-14 15:56:45,814 - INFO - Finished converting document 4_2023-09-12 in 0.08 sec.
2025-11-14 15:56:45,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,887 - INFO - Going to convert document batch...
2025-11-14 15:56:45,889 - INFO - Processing document 4_2023-09-13
2025-11-14 15:56:45,936 - INFO - Finished converting document 4_2023-09-13 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2023-09-01' --> 'data\processed_data\CL\4_2023-09-01.md'
Converted 'data\edgar_documents\CL\4_2023-09-12' --> 'data\processed_data\CL\4_2023-09-12.md'


2025-11-14 15:56:45,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,013 - INFO - Going to convert document batch...
2025-11-14 15:56:46,014 - INFO - Processing document 4_2023-09-15
2025-11-14 15:56:46,057 - INFO - Finished converting document 4_2023-09-15 in 0.09 sec.
2025-11-14 15:56:46,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,149 - INFO - Going to convert document batch...
2025-11-14 15:56:46,150 - INFO - Processing document 4_2023-10-04


Converted 'data\edgar_documents\CL\4_2023-09-13' --> 'data\processed_data\CL\4_2023-09-13.md'
Converted 'data\edgar_documents\CL\4_2023-09-15' --> 'data\processed_data\CL\4_2023-09-15.md'


2025-11-14 15:56:46,203 - INFO - Finished converting document 4_2023-10-04 in 0.11 sec.
2025-11-14 15:56:46,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,281 - INFO - Going to convert document batch...
2025-11-14 15:56:46,283 - INFO - Processing document 4_2023-10-17
2025-11-14 15:56:46,319 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.
2025-11-14 15:56:46,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2023-10-04' --> 'data\processed_data\CL\4_2023-10-04.md'
Converted 'data\edgar_documents\CL\4_2023-10-17' --> 'data\processed_data\CL\4_2023-10-17.md'


2025-11-14 15:56:46,426 - INFO - Going to convert document batch...
2025-11-14 15:56:46,428 - INFO - Processing document 4_2023-11-06
2025-11-14 15:56:46,468 - INFO - Finished converting document 4_2023-11-06 in 0.09 sec.
2025-11-14 15:56:46,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,556 - INFO - Going to convert document batch...
2025-11-14 15:56:46,557 - INFO - Processing document 4_2023-11-07
2025-11-14 15:56:46,605 - INFO - Finished converting document 4_2023-11-07 in 0.11 sec.


Converted 'data\edgar_documents\CL\4_2023-11-06' --> 'data\processed_data\CL\4_2023-11-06.md'
Converted 'data\edgar_documents\CL\4_2023-11-07' --> 'data\processed_data\CL\4_2023-11-07.md'


2025-11-14 15:56:46,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,708 - INFO - Going to convert document batch...
2025-11-14 15:56:46,710 - INFO - Processing document 4_2023-11-13
2025-11-14 15:56:46,746 - INFO - Finished converting document 4_2023-11-13 in 0.11 sec.
2025-11-14 15:56:46,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,810 - INFO - Going to convert document batch...
2025-11-14 15:56:46,811 - INFO - Processing document 4_2023-11-14
2025-11-14 15:56:46,891 - INFO - Finished converting document 4_2023-11-14 in 0.11 sec.
2025-11-14 15:56:46,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2023-11-13' --> 'data\processed_data\CL\4_2023-11-13.md'
Converted 'data\edgar_documents\CL\4_2023-11-14' --> 'data\processed_data\CL\4_2023-11-14.md'


2025-11-14 15:56:46,993 - INFO - Going to convert document batch...
2025-11-14 15:56:46,994 - INFO - Processing document 4_2023-11-17
2025-11-14 15:56:47,042 - INFO - Finished converting document 4_2023-11-17 in 0.11 sec.
2025-11-14 15:56:47,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,157 - INFO - Going to convert document batch...
2025-11-14 15:56:47,159 - INFO - Processing document 4_2023-11-30
2025-11-14 15:56:47,209 - INFO - Finished converting document 4_2023-11-30 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-11-17' --> 'data\processed_data\CL\4_2023-11-17.md'


2025-11-14 15:56:47,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,353 - INFO - Going to convert document batch...
2025-11-14 15:56:47,355 - INFO - Processing document 4_2023-12-04
2025-11-14 15:56:47,427 - INFO - Finished converting document 4_2023-12-04 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-11-30' --> 'data\processed_data\CL\4_2023-11-30.md'
Converted 'data\edgar_documents\CL\4_2023-12-04' --> 'data\processed_data\CL\4_2023-12-04.md'


2025-11-14 15:56:47,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,516 - INFO - Going to convert document batch...
2025-11-14 15:56:47,517 - INFO - Processing document 4_2023-12-08
2025-11-14 15:56:47,550 - INFO - Finished converting document 4_2023-12-08 in 0.08 sec.
2025-11-14 15:56:47,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,626 - INFO - Going to convert document batch...
2025-11-14 15:56:47,628 - INFO - Processing document 4_2024-01-04
2025-11-14 15:56:47,664 - INFO - Finished converting document 4_2024-01-04 in 0.08 sec.
2025-11-14 15:56:47,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,781 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2023-12-08' --> 'data\processed_data\CL\4_2023-12-08.md'
Converted 'data\edgar_documents\CL\4_2024-01-04' --> 'data\processed_data\CL\4_2024-01-04.md'


2025-11-14 15:56:47,782 - INFO - Processing document 4_2024-02-02
2025-11-14 15:56:47,846 - INFO - Finished converting document 4_2024-02-02 in 0.14 sec.
2025-11-14 15:56:47,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,938 - INFO - Going to convert document batch...
2025-11-14 15:56:47,940 - INFO - Processing document 4_2024-02-07
2025-11-14 15:56:47,993 - INFO - Finished converting document 4_2024-02-07 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-02-02' --> 'data\processed_data\CL\4_2024-02-02.md'
Converted 'data\edgar_documents\CL\4_2024-02-07' --> 'data\processed_data\CL\4_2024-02-07.md'


2025-11-14 15:56:48,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,131 - INFO - Going to convert document batch...
2025-11-14 15:56:48,134 - INFO - Processing document 4_2024-02-13
2025-11-14 15:56:48,194 - INFO - Finished converting document 4_2024-02-13 in 0.14 sec.
2025-11-14 15:56:48,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,360 - INFO - Going to convert document batch...
2025-11-14 15:56:48,361 - INFO - Processing document 4_2024-02-14
2025-11-14 15:56:48,429 - INFO - Finished converting document 4_2024-02-14 in 0.17 sec.


Converted 'data\edgar_documents\CL\4_2024-02-13' --> 'data\processed_data\CL\4_2024-02-13.md'


2025-11-14 15:56:48,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,556 - INFO - Going to convert document batch...
2025-11-14 15:56:48,558 - INFO - Processing document 4_2024-02-15
2025-11-14 15:56:48,601 - INFO - Finished converting document 4_2024-02-15 in 0.11 sec.
2025-11-14 15:56:48,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,673 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2024-02-14' --> 'data\processed_data\CL\4_2024-02-14.md'
Converted 'data\edgar_documents\CL\4_2024-02-15' --> 'data\processed_data\CL\4_2024-02-15.md'


2025-11-14 15:56:48,674 - INFO - Processing document 4_2024-02-20
2025-11-14 15:56:48,714 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 15:56:48,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,787 - INFO - Going to convert document batch...
2025-11-14 15:56:48,788 - INFO - Processing document 4_2024-04-03
2025-11-14 15:56:48,819 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:56:48,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,918 - INFO - Going to convert document batch...
2025-11-14 15:56:48,919 - INFO - Processing document 4_2024-05-03
2025-11-14 15:56:48,960 - INFO - Finished converting document 4_2024-05-03 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-02-20' --> 'data\processed_data\CL\4_2024-02-20.md'
Converted 'data\edgar_documents\CL\4_2024-04-03' --> 'data\processed_data\CL\4_2024-04-03.md'


2025-11-14 15:56:49,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,041 - INFO - Going to convert document batch...
2025-11-14 15:56:49,042 - INFO - Processing document 4_2024-05-09
2025-11-14 15:56:49,073 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.
2025-11-14 15:56:49,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,159 - INFO - Going to convert document batch...
2025-11-14 15:56:49,160 - INFO - Processing document 4_2024-05-10
2025-11-14 15:56:49,202 - INFO - Finished converting document 4_2024-05-10 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-05-03' --> 'data\processed_data\CL\4_2024-05-03.md'
Converted 'data\edgar_documents\CL\4_2024-05-09' --> 'data\processed_data\CL\4_2024-05-09.md'


2025-11-14 15:56:49,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,262 - INFO - Going to convert document batch...
2025-11-14 15:56:49,262 - INFO - Processing document 4_2024-05-15
2025-11-14 15:56:49,300 - INFO - Finished converting document 4_2024-05-15 in 0.06 sec.
2025-11-14 15:56:49,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,397 - INFO - Going to convert document batch...
2025-11-14 15:56:49,399 - INFO - Processing document 4_2024-05-16


Converted 'data\edgar_documents\CL\4_2024-05-10' --> 'data\processed_data\CL\4_2024-05-10.md'
Converted 'data\edgar_documents\CL\4_2024-05-15' --> 'data\processed_data\CL\4_2024-05-15.md'


2025-11-14 15:56:49,459 - INFO - Finished converting document 4_2024-05-16 in 0.09 sec.
2025-11-14 15:56:49,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,548 - INFO - Going to convert document batch...
2025-11-14 15:56:49,550 - INFO - Processing document 4_2024-07-03
2025-11-14 15:56:49,630 - INFO - Finished converting document 4_2024-07-03 in 0.12 sec.
2025-11-14 15:56:49,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2024-05-16' --> 'data\processed_data\CL\4_2024-05-16.md'
Converted 'data\edgar_documents\CL\4_2024-07-03' --> 'data\processed_data\CL\4_2024-07-03.md'


2025-11-14 15:56:49,709 - INFO - Going to convert document batch...
2025-11-14 15:56:49,711 - INFO - Processing document 4_2024-08-02
2025-11-14 15:56:49,750 - INFO - Finished converting document 4_2024-08-02 in 0.09 sec.
2025-11-14 15:56:49,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,819 - INFO - Going to convert document batch...
2025-11-14 15:56:49,819 - INFO - Processing document 4_2024-08-08
2025-11-14 15:56:49,845 - INFO - Finished converting document 4_2024-08-08 in 0.06 sec.
2025-11-14 15:56:49,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,910 - INFO - Going to convert document batch...
2025-11-14 15:56:49,911 - INFO - Processing document 4_2024-08-12
2025-11-14 15:56:49,938 - INFO - Finished converting document 4_2024-08-12 in 0.06 sec.


Converted 'data\edgar_documents\CL\4_2024-08-02' --> 'data\processed_data\CL\4_2024-08-02.md'
Converted 'data\edgar_documents\CL\4_2024-08-08' --> 'data\processed_data\CL\4_2024-08-08.md'


2025-11-14 15:56:49,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,993 - INFO - Going to convert document batch...
2025-11-14 15:56:49,994 - INFO - Processing document 4_2024-08-27
2025-11-14 15:56:50,016 - INFO - Finished converting document 4_2024-08-27 in 0.05 sec.
2025-11-14 15:56:50,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,074 - INFO - Going to convert document batch...
2025-11-14 15:56:50,075 - INFO - Processing document 4_2024-09-12
2025-11-14 15:56:50,095 - INFO - Finished converting document 4_2024-09-12 in 0.05 sec.
2025-11-14 15:56:50,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,147 - INFO - Going to convert document batch...
2025-11-14 15:56:50,147 - INFO - Processing document 4_2024-09-16
2025-11-14 15:56:50,170 - INFO - Finished converting document 4_2024-09-16 in 0.06 sec.


Converted 'data\edgar_documents\CL\4_2024-08-12' --> 'data\processed_data\CL\4_2024-08-12.md'
Converted 'data\edgar_documents\CL\4_2024-08-27' --> 'data\processed_data\CL\4_2024-08-27.md'
Converted 'data\edgar_documents\CL\4_2024-09-12' --> 'data\processed_data\CL\4_2024-09-12.md'


2025-11-14 15:56:50,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,226 - INFO - Going to convert document batch...
2025-11-14 15:56:50,227 - INFO - Processing document 4_2024-10-03
2025-11-14 15:56:50,245 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 15:56:50,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,316 - INFO - Going to convert document batch...
2025-11-14 15:56:50,317 - INFO - Processing document 4_2024-11-05
2025-11-14 15:56:50,336 - INFO - Finished converting document 4_2024-11-05 in 0.06 sec.
2025-11-14 15:56:50,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,376 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2024-09-16' --> 'data\processed_data\CL\4_2024-09-16.md'
Converted 'data\edgar_documents\CL\4_2024-10-03' --> 'data\processed_data\CL\4_2024-10-03.md'
Converted 'data\edgar_documents\CL\4_2024-11-05' --> 'data\processed_data\CL\4_2024-11-05.md'


2025-11-14 15:56:50,377 - INFO - Processing document 4_2024-11-07
2025-11-14 15:56:50,399 - INFO - Finished converting document 4_2024-11-07 in 0.03 sec.
2025-11-14 15:56:50,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,454 - INFO - Going to convert document batch...
2025-11-14 15:56:50,455 - INFO - Processing document 4_2024-11-26
2025-11-14 15:56:50,473 - INFO - Finished converting document 4_2024-11-26 in 0.05 sec.
2025-11-14 15:56:50,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,525 - INFO - Going to convert document batch...
2025-11-14 15:56:50,527 - INFO - Processing document 4_2024-11-27
2025-11-14 15:56:50,543 - INFO - Finished converting document 4_2024-11-27 in 0.06 sec.
2025-11-14 15:56:50,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,597 - INFO - Going to convert document batch...
2025-11-14 15:56:50,598 - INFO - Processing document 4_2024-12-05


Converted 'data\edgar_documents\CL\4_2024-11-07' --> 'data\processed_data\CL\4_2024-11-07.md'
Converted 'data\edgar_documents\CL\4_2024-11-26' --> 'data\processed_data\CL\4_2024-11-26.md'
Converted 'data\edgar_documents\CL\4_2024-11-27' --> 'data\processed_data\CL\4_2024-11-27.md'


2025-11-14 15:56:50,615 - INFO - Finished converting document 4_2024-12-05 in 0.05 sec.
2025-11-14 15:56:50,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,665 - INFO - Going to convert document batch...
2025-11-14 15:56:50,665 - INFO - Processing document 4_2025-01-06
2025-11-14 15:56:50,682 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:56:50,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,727 - INFO - Going to convert document batch...
2025-11-14 15:56:50,728 - INFO - Processing document 4_2025-02-18
2025-11-14 15:56:50,747 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:56:50,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,796 - INFO - Going to convert document batch...
2025-11-14 15:56:50,797 - INFO - Processing document 4_2025-02-27
2025-11-14 15:56:50,815 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.


Converted 'data\edgar_documents\CL\4_2024-12-05' --> 'data\processed_data\CL\4_2024-12-05.md'
Converted 'data\edgar_documents\CL\4_2025-01-06' --> 'data\processed_data\CL\4_2025-01-06.md'
Converted 'data\edgar_documents\CL\4_2025-02-18' --> 'data\processed_data\CL\4_2025-02-18.md'


2025-11-14 15:56:50,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,867 - INFO - Going to convert document batch...
2025-11-14 15:56:50,868 - INFO - Processing document 4_2025-04-03
2025-11-14 15:56:50,887 - INFO - Finished converting document 4_2025-04-03 in 0.06 sec.
2025-11-14 15:56:50,936 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:50,936 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56

Converted 'data\edgar_documents\CL\4_2025-02-27' --> 'data\processed_data\CL\4_2025-02-27.md'
Converted 'data\edgar_documents\CL\4_2025-04-03' --> 'data\processed_data\CL\4_2025-04-03.md'
Error processing data\edgar_documents\CL\4_2025-04-28: File format not allowed: data\edgar_documents\CL\4_2025-04-28
Error processing data\edgar_documents\CL\4_2025-04-30: File format not allowed: data\edgar_documents\CL\4_2025-04-30


2025-11-14 15:56:51,071 - INFO - Finished converting document 4_2025-05-14 in 0.11 sec.
2025-11-14 15:56:51,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,181 - INFO - Going to convert document batch...
2025-11-14 15:56:51,183 - INFO - Processing document 4_2025-05-19
2025-11-14 15:56:51,222 - INFO - Finished converting document 4_2025-05-19 in 0.08 sec.
2025-11-14 15:56:51,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,300 - INFO - Going to convert document batch...
2025-11-14 15:56:51,301 - INFO - Processing document 4_2025-06-18


Converted 'data\edgar_documents\CL\4_2025-05-14' --> 'data\processed_data\CL\4_2025-05-14.md'
Converted 'data\edgar_documents\CL\4_2025-05-19' --> 'data\processed_data\CL\4_2025-05-19.md'


2025-11-14 15:56:51,335 - INFO - Finished converting document 4_2025-06-18 in 0.06 sec.
2025-11-14 15:56:51,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,415 - INFO - Going to convert document batch...
2025-11-14 15:56:51,416 - INFO - Processing document 4_2025-07-02
2025-11-14 15:56:51,451 - INFO - Finished converting document 4_2025-07-02 in 0.08 sec.
2025-11-14 15:56:51,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,517 - INFO - Going to convert document batch...
2025-11-14 15:56:51,518 - INFO - Processing document 4_2025-09-12
2025-11-14 15:56:51,562 - INFO - Finished converting document 4_2025-09-12 in 0.08 sec.


Converted 'data\edgar_documents\CL\4_2025-06-18' --> 'data\processed_data\CL\4_2025-06-18.md'
Converted 'data\edgar_documents\CL\4_2025-07-02' --> 'data\processed_data\CL\4_2025-07-02.md'


2025-11-14 15:56:51,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2025-09-12' --> 'data\processed_data\CL\4_2025-09-12.md'


2025-11-14 15:56:52,421 - INFO - Going to convert document batch...
2025-11-14 15:56:52,423 - INFO - Processing document 4_2025-09-16
2025-11-14 15:56:52,466 - INFO - Finished converting document 4_2025-09-16 in 0.88 sec.
2025-11-14 15:56:52,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,553 - INFO - Going to convert document batch...
2025-11-14 15:56:52,554 - INFO - Processing document 4_2025-10-03
2025-11-14 15:56:52,600 - INFO - Finished converting document 4_2025-10-03 in 0.08 sec.
2025-11-14 15:56:52,677 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:52,678 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CL\4_2025-09-16' --> 'data\processed_data\CL\4_2025-09-16.md'
Converted 'data\edgar_documents\CL\4_2025-10-03' --> 'data\processed_data\CL\4_2025-10-03.md'
Error processing data\edgar_documents\CL\4_2025-11-03: File format not allowed: data\edgar_documents\CL\4_2025-11-03


2025-11-14 15:56:52,700 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:52,702 - ERROR - Input document 4_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:52,703 - INFO - Going to convert document batch...
2025-11-14 15:56:52,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,755 - INFO - Going to convert document batch...
2025-11-14 15:56:52,757 - INFO - Processing document 8-K_2023-01-12
2025-11-14 15:56:52,800 - INFO - F

Error processing data\edgar_documents\CL\4_2025-11-05: File format not allowed: data\edgar_documents\CL\4_2025-11-05
Converted 'data\edgar_documents\CL\8-K_2023-01-12' --> 'data\processed_data\CL\8-K_2023-01-12.md'


2025-11-14 15:56:52,911 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 15:56:52,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,971 - INFO - Going to convert document batch...
2025-11-14 15:56:52,972 - INFO - Processing document 8-K_2023-01-30
2025-11-14 15:56:53,005 - INFO - Finished converting document 8-K_2023-01-30 in 0.08 sec.
2025-11-14 15:56:53,063 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:53,064 - ERROR - Input document 8-K_2023-03-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS:

Converted 'data\edgar_documents\CL\8-K_2023-01-27' --> 'data\processed_data\CL\8-K_2023-01-27.md'
Converted 'data\edgar_documents\CL\8-K_2023-01-30' --> 'data\processed_data\CL\8-K_2023-01-30.md'
Error processing data\edgar_documents\CL\8-K_2023-03-01: File format not allowed: data\edgar_documents\CL\8-K_2023-03-01


2025-11-14 15:56:53,133 - INFO - Processing document 8-K_2023-04-28
2025-11-14 15:56:53,188 - INFO - Finished converting document 8-K_2023-04-28 in 0.12 sec.
2025-11-14 15:56:53,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,323 - INFO - Going to convert document batch...
2025-11-14 15:56:53,325 - INFO - Processing document 8-K_2023-05-17
2025-11-14 15:56:53,399 - INFO - Finished converting document 8-K_2023-05-17 in 0.19 sec.


Converted 'data\edgar_documents\CL\8-K_2023-04-28' --> 'data\processed_data\CL\8-K_2023-04-28.md'


2025-11-14 15:56:53,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,489 - INFO - Going to convert document batch...
2025-11-14 15:56:53,490 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:56:53,535 - INFO - Finished converting document 8-K_2023-07-28 in 0.09 sec.
2025-11-14 15:56:53,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,616 - INFO - Going to convert document batch...
2025-11-14 15:56:53,617 - INFO - Processing document 8-K_2023-08-18


Converted 'data\edgar_documents\CL\8-K_2023-05-17' --> 'data\processed_data\CL\8-K_2023-05-17.md'
Converted 'data\edgar_documents\CL\8-K_2023-07-28' --> 'data\processed_data\CL\8-K_2023-07-28.md'


2025-11-14 15:56:53,660 - INFO - Finished converting document 8-K_2023-08-18 in 0.09 sec.
2025-11-14 15:56:53,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,742 - INFO - Going to convert document batch...
2025-11-14 15:56:53,744 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:56:53,784 - INFO - Finished converting document 8-K_2023-09-15 in 0.11 sec.
2025-11-14 15:56:53,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,844 - INFO - Going to convert document batch...
2025-11-14 15:56:53,845 - INFO - Processing document 8-K_2023-10-27


Converted 'data\edgar_documents\CL\8-K_2023-08-18' --> 'data\processed_data\CL\8-K_2023-08-18.md'
Converted 'data\edgar_documents\CL\8-K_2023-09-15' --> 'data\processed_data\CL\8-K_2023-09-15.md'


2025-11-14 15:56:53,896 - INFO - Finished converting document 8-K_2023-10-27 in 0.09 sec.
2025-11-14 15:56:53,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,968 - INFO - Going to convert document batch...
2025-11-14 15:56:53,969 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:56:54,015 - INFO - Finished converting document 8-K_2024-01-26 in 0.09 sec.
2025-11-14 15:56:54,116 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CL\8-K_2023-10-27' --> 'data\processed_data\CL\8-K_2023-10-27.md'
Converted 'data\edgar_documents\CL\8-K_2024-01-26' --> 'data\processed_data\CL\8-K_2024-01-26.md'


2025-11-14 15:56:54,120 - ERROR - Input document 8-K_2024-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:54,123 - INFO - Going to convert document batch...
2025-11-14 15:56:54,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,206 - INFO - Going to convert document batch...
2025-11-14 15:56:54,207 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:56:54,247 - INFO - Finished converting document 8-K_2024-04-26 in 0.12 sec.
2025-11-14 15:56:54,297 - INFO -

Error processing data\edgar_documents\CL\8-K_2024-02-15: File format not allowed: data\edgar_documents\CL\8-K_2024-02-15
Converted 'data\edgar_documents\CL\8-K_2024-04-26' --> 'data\processed_data\CL\8-K_2024-04-26.md'


2025-11-14 15:56:54,356 - INFO - Going to convert document batch...
2025-11-14 15:56:54,359 - INFO - Processing document 8-K_2024-05-15
2025-11-14 15:56:54,429 - INFO - Finished converting document 8-K_2024-05-15 in 0.14 sec.
2025-11-14 15:56:54,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,522 - INFO - Going to convert document batch...
2025-11-14 15:56:54,524 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:56:54,574 - INFO - Finished converting document 8-K_2024-07-26 in 0.12 sec.
2025-11-14 15:56:54,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2024-05-15' --> 'data\processed_data\CL\8-K_2024-05-15.md'
Converted 'data\edgar_documents\CL\8-K_2024-07-26' --> 'data\processed_data\CL\8-K_2024-07-26.md'


2025-11-14 15:56:54,663 - INFO - Going to convert document batch...
2025-11-14 15:56:54,663 - INFO - Processing document 8-K_2024-10-25
2025-11-14 15:56:54,727 - INFO - Finished converting document 8-K_2024-10-25 in 0.12 sec.
2025-11-14 15:56:54,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,854 - INFO - Going to convert document batch...
2025-11-14 15:56:54,856 - INFO - Processing document 8-K_2025-01-24
2025-11-14 15:56:54,937 - INFO - Finished converting document 8-K_2025-01-24 in 0.19 sec.


Converted 'data\edgar_documents\CL\8-K_2024-10-25' --> 'data\processed_data\CL\8-K_2024-10-25.md'


2025-11-14 15:56:55,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,041 - INFO - Going to convert document batch...
2025-11-14 15:56:55,043 - INFO - Processing document 8-K_2025-01-31
2025-11-14 15:56:55,109 - INFO - Finished converting document 8-K_2025-01-31 in 0.12 sec.


Converted 'data\edgar_documents\CL\8-K_2025-01-24' --> 'data\processed_data\CL\8-K_2025-01-24.md'
Converted 'data\edgar_documents\CL\8-K_2025-01-31' --> 'data\processed_data\CL\8-K_2025-01-31.md'


2025-11-14 15:56:55,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,243 - INFO - Going to convert document batch...
2025-11-14 15:56:55,244 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:56:55,371 - INFO - Finished converting document 8-K_2025-04-25 in 0.22 sec.
2025-11-14 15:56:55,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,465 - INFO - Going to convert document batch...
2025-11-14 15:56:55,467 - INFO - Processing document 8-K_2025-05-02
2025-11-14 15:56:55,510 - INFO - Finished converting document 8-K_2025-05-02 in 0.11 sec.
2025-11-14 15:56:55,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2025-04-25' --> 'data\processed_data\CL\8-K_2025-04-25.md'
Converted 'data\edgar_documents\CL\8-K_2025-05-02' --> 'data\processed_data\CL\8-K_2025-05-02.md'


2025-11-14 15:56:55,616 - INFO - Going to convert document batch...
2025-11-14 15:56:55,617 - INFO - Processing document 8-K_2025-05-14
2025-11-14 15:56:55,688 - INFO - Finished converting document 8-K_2025-05-14 in 0.16 sec.
2025-11-14 15:56:55,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,762 - INFO - Going to convert document batch...
2025-11-14 15:56:55,763 - INFO - Processing document 8-K_2025-05-29
2025-11-14 15:56:55,798 - INFO - Finished converting document 8-K_2025-05-29 in 0.08 sec.
2025-11-14 15:56:55,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,853 - INFO - Going to convert document batch...
2025-11-14 15:56:55,854 - INFO - Processing document 8-K_2025-08-01
2025-11-14 15:56:55,889 - INFO - Finished converting document 8-K_2025-08-01 in 0.08 sec.


Converted 'data\edgar_documents\CL\8-K_2025-05-14' --> 'data\processed_data\CL\8-K_2025-05-14.md'
Converted 'data\edgar_documents\CL\8-K_2025-05-29' --> 'data\processed_data\CL\8-K_2025-05-29.md'


2025-11-14 15:56:55,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,978 - INFO - Going to convert document batch...
2025-11-14 15:56:55,980 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:56:56,035 - INFO - Finished converting document 8-K_2025-10-31 in 0.11 sec.
2025-11-14 15:56:56,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2025-08-01' --> 'data\processed_data\CL\8-K_2025-08-01.md'
Converted 'data\edgar_documents\CL\8-K_2025-10-31' --> 'data\processed_data\CL\8-K_2025-10-31.md'


2025-11-14 15:56:56,146 - INFO - Going to convert document batch...
2025-11-14 15:56:56,148 - INFO - Processing document 8-K_2025-11-10
2025-11-14 15:56:56,206 - INFO - Finished converting document 8-K_2025-11-10 in 0.12 sec.
2025-11-14 15:56:56,332 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:56,333 - ERROR - Input document DEF-14A_2023-03-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:56,336 - INFO - Going to convert 

Converted 'data\edgar_documents\CL\8-K_2025-11-10' --> 'data\processed_data\CL\8-K_2025-11-10.md'
Error processing data\edgar_documents\CL\DEF-14A_2023-03-29: File format not allowed: data\edgar_documents\CL\DEF-14A_2023-03-29


2025-11-14 15:56:57,799 - INFO - Going to convert document batch...
2025-11-14 15:56:57,800 - INFO - Processing document DEF-14A_2024-03-27
2025-11-14 15:57:17,015 - INFO - Finished converting document DEF-14A_2024-03-27 in 20.67 sec.
2025-11-14 15:57:19,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\DEF-14A_2024-03-27' --> 'data\processed_data\CL\DEF-14A_2024-03-27.md'


2025-11-14 15:57:21,316 - INFO - Going to convert document batch...
2025-11-14 15:57:21,318 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 15:57:52,496 - INFO - Finished converting document DEF-14A_2025-03-26 in 33.39 sec.
2025-11-14 15:57:53,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\DEF-14A_2025-03-26' --> 'data\processed_data\CL\DEF-14A_2025-03-26.md'
Processed 103 new files. Errors: 8
Found 141 files to process in data\edgar_documents\CMCSA


2025-11-14 15:57:54,413 - INFO - Going to convert document batch...
2025-11-14 15:57:54,414 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:57:54,415 - INFO - Processing document 10-K_2023-02-03
2025-11-14 15:57:55,912 - INFO - Finished converting document 10-K_2023-02-03 in 2.41 sec.
2025-11-14 15:57:56,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2023-02-03' --> 'data\processed_data\CMCSA\10-K_2023-02-03.md'


2025-11-14 15:57:57,281 - INFO - Going to convert document batch...
2025-11-14 15:57:57,282 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:57:58,775 - INFO - Finished converting document 10-K_2024-01-31 in 2.11 sec.
2025-11-14 15:57:59,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2024-01-31' --> 'data\processed_data\CMCSA\10-K_2024-01-31.md'


2025-11-14 15:58:00,265 - INFO - Going to convert document batch...
2025-11-14 15:58:00,266 - INFO - Processing document 10-K_2025-01-31
2025-11-14 15:58:01,791 - INFO - Finished converting document 10-K_2025-01-31 in 2.12 sec.
2025-11-14 15:58:02,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2025-01-31' --> 'data\processed_data\CMCSA\10-K_2025-01-31.md'


2025-11-14 15:58:03,074 - INFO - Going to convert document batch...
2025-11-14 15:58:03,074 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 15:58:03,684 - INFO - Finished converting document 10-Q_2023-04-27 in 1.30 sec.
2025-11-14 15:58:04,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-04-27' --> 'data\processed_data\CMCSA\10-Q_2023-04-27.md'


2025-11-14 15:58:04,424 - INFO - Going to convert document batch...
2025-11-14 15:58:04,426 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:58:05,513 - INFO - Finished converting document 10-Q_2023-07-27 in 1.52 sec.
2025-11-14 15:58:05,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-07-27' --> 'data\processed_data\CMCSA\10-Q_2023-07-27.md'


2025-11-14 15:58:06,325 - INFO - Going to convert document batch...
2025-11-14 15:58:06,326 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:58:07,066 - INFO - Finished converting document 10-Q_2023-10-26 in 1.16 sec.
2025-11-14 15:58:07,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-10-26' --> 'data\processed_data\CMCSA\10-Q_2023-10-26.md'


2025-11-14 15:58:07,735 - INFO - Going to convert document batch...
2025-11-14 15:58:07,736 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 15:58:08,568 - INFO - Finished converting document 10-Q_2024-04-25 in 1.12 sec.
2025-11-14 15:58:08,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-04-25' --> 'data\processed_data\CMCSA\10-Q_2024-04-25.md'


2025-11-14 15:58:09,237 - INFO - Going to convert document batch...
2025-11-14 15:58:09,237 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 15:58:09,888 - INFO - Finished converting document 10-Q_2024-07-23 in 1.03 sec.
2025-11-14 15:58:10,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-07-23' --> 'data\processed_data\CMCSA\10-Q_2024-07-23.md'


2025-11-14 15:58:10,933 - INFO - Going to convert document batch...
2025-11-14 15:58:10,933 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:58:11,579 - INFO - Finished converting document 10-Q_2024-10-31 in 1.38 sec.
2025-11-14 15:58:11,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-10-31' --> 'data\processed_data\CMCSA\10-Q_2024-10-31.md'


2025-11-14 15:58:12,185 - INFO - Going to convert document batch...
2025-11-14 15:58:12,186 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 15:58:12,707 - INFO - Finished converting document 10-Q_2025-04-24 in 0.80 sec.
2025-11-14 15:58:13,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2025-04-24' --> 'data\processed_data\CMCSA\10-Q_2025-04-24.md'


2025-11-14 15:58:13,659 - INFO - Going to convert document batch...
2025-11-14 15:58:13,660 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 15:58:14,301 - INFO - Finished converting document 10-Q_2025-07-31 in 1.33 sec.
2025-11-14 15:58:14,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2025-07-31' --> 'data\processed_data\CMCSA\10-Q_2025-07-31.md'


2025-11-14 15:58:15,047 - INFO - Going to convert document batch...
2025-11-14 15:58:15,047 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 15:58:15,723 - INFO - Finished converting document 10-Q_2025-10-30 in 1.09 sec.
2025-11-14 15:58:16,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,109 - INFO - Going to convert document batch...
2025-11-14 15:58:16,109 - INFO - Processing document 4_2023-01-04
2025-11-14 15:58:16,127 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 15:58:16,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,182 - INFO - Going to convert document batch...
2025-11-14 15:58:16,183 - INFO - Processing document 4_2023-01-05
2025-11-14 15:58:16,201 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 15:58:16,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,238 - INFO - Going to convert document batch...
2025-11-14 15:58:16,

Converted 'data\edgar_documents\CMCSA\10-Q_2025-10-30' --> 'data\processed_data\CMCSA\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-04' --> 'data\processed_data\CMCSA\4_2023-01-04.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-05' --> 'data\processed_data\CMCSA\4_2023-01-05.md'


2025-11-14 15:58:16,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,297 - INFO - Going to convert document batch...
2025-11-14 15:58:16,299 - INFO - Processing document 4_2023-01-09
2025-11-14 15:58:16,317 - INFO - Finished converting document 4_2023-01-09 in 0.03 sec.
2025-11-14 15:58:16,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,372 - INFO - Going to convert document batch...
2025-11-14 15:58:16,373 - INFO - Processing document 4_2023-01-27
2025-11-14 15:58:16,389 - INFO - Finished converting document 4_2023-01-27 in 0.06 sec.
2025-11-14 15:58:16,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,453 - INFO - Going to convert document batch...
2025-11-14 15:58:16,454 - INFO - Processing document 4_2023-01-30


Converted 'data\edgar_documents\CMCSA\4_2023-01-06' --> 'data\processed_data\CMCSA\4_2023-01-06.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-09' --> 'data\processed_data\CMCSA\4_2023-01-09.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-27' --> 'data\processed_data\CMCSA\4_2023-01-27.md'


2025-11-14 15:58:16,481 - INFO - Finished converting document 4_2023-01-30 in 0.08 sec.
2025-11-14 15:58:16,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,525 - INFO - Going to convert document batch...
2025-11-14 15:58:16,526 - INFO - Processing document 4_2023-02-01
2025-11-14 15:58:16,558 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 15:58:16,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,607 - INFO - Going to convert document batch...
2025-11-14 15:58:16,608 - INFO - Processing document 4_2023-02-06
2025-11-14 15:58:16,640 - INFO - Finished converting document 4_2023-02-06 in 0.06 sec.


Converted 'data\edgar_documents\CMCSA\4_2023-01-30' --> 'data\processed_data\CMCSA\4_2023-01-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-02-01' --> 'data\processed_data\CMCSA\4_2023-02-01.md'
Converted 'data\edgar_documents\CMCSA\4_2023-02-06' --> 'data\processed_data\CMCSA\4_2023-02-06.md'


2025-11-14 15:58:16,710 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:16,711 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:58:16,713 - INFO - Going to convert document batch...
2025-11-14 15:58:16,735 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:16,736 - ERROR - Input document 4_2023-02-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CMCSA\4_2023-02-07: File format not allowed: data\edgar_documents\CMCSA\4_2023-02-07
Error processing data\edgar_documents\CMCSA\4_2023-02-08: File format not allowed: data\edgar_documents\CMCSA\4_2023-02-08
Converted 'data\edgar_documents\CMCSA\4_2023-02-16' --> 'data\processed_data\CMCSA\4_2023-02-16.md'


2025-11-14 15:58:17,091 - INFO - Going to convert document batch...
2025-11-14 15:58:17,091 - INFO - Processing document 4_2023-02-21
2025-11-14 15:58:17,124 - INFO - Finished converting document 4_2023-02-21 in 0.33 sec.
2025-11-14 15:58:17,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,173 - INFO - Going to convert document batch...
2025-11-14 15:58:17,173 - INFO - Processing document 4_2023-03-03
2025-11-14 15:58:17,196 - INFO - Finished converting document 4_2023-03-03 in 0.03 sec.
2025-11-14 15:58:17,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,233 - INFO - Going to convert document batch...
2025-11-14 15:58:17,234 - INFO - Processing document 4_2023-03-09
2025-11-14 15:58:17,251 - INFO - Finished converting document 4_2023-03-09 in 0.03 sec.
2025-11-14 15:58:17,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,287 - INFO - Going to convert document batch...
2025-11-14 15:58:17,288 - 

Converted 'data\edgar_documents\CMCSA\4_2023-02-21' --> 'data\processed_data\CMCSA\4_2023-02-21.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-03' --> 'data\processed_data\CMCSA\4_2023-03-03.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-09' --> 'data\processed_data\CMCSA\4_2023-03-09.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-17' --> 'data\processed_data\CMCSA\4_2023-03-17.md'


2025-11-14 15:58:17,353 - INFO - Going to convert document batch...
2025-11-14 15:58:17,355 - INFO - Processing document 4_2023-03-30
2025-11-14 15:58:17,373 - INFO - Finished converting document 4_2023-03-30 in 0.06 sec.
2025-11-14 15:58:17,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,417 - INFO - Going to convert document batch...
2025-11-14 15:58:17,418 - INFO - Processing document 4_2023-04-04
2025-11-14 15:58:17,435 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 15:58:17,473 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:17,474 - ERROR - Input document 4_2023-05-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CMCSA\4_2023-03-30' --> 'data\processed_data\CMCSA\4_2023-03-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-04-04' --> 'data\processed_data\CMCSA\4_2023-04-04.md'
Error processing data\edgar_documents\CMCSA\4_2023-05-02: File format not allowed: data\edgar_documents\CMCSA\4_2023-05-02
Converted 'data\edgar_documents\CMCSA\4_2023-05-24' --> 'data\processed_data\CMCSA\4_2023-05-24.md'


2025-11-14 15:58:17,579 - INFO - Processing document 4_2023-06-06
2025-11-14 15:58:17,599 - INFO - Finished converting document 4_2023-06-06 in 0.05 sec.
2025-11-14 15:58:17,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,642 - INFO - Going to convert document batch...
2025-11-14 15:58:17,643 - INFO - Processing document 4_2023-06-14
2025-11-14 15:58:17,660 - INFO - Finished converting document 4_2023-06-14 in 0.03 sec.
2025-11-14 15:58:17,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,701 - INFO - Going to convert document batch...
2025-11-14 15:58:17,701 - INFO - Processing document 4_2023-06-21
2025-11-14 15:58:17,721 - INFO - Finished converting document 4_2023-06-21 in 0.03 sec.
2025-11-14 15:58:17,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,785 - INFO - Going to convert document batch...
2025-11-14 15:58:17,786 - INFO - Processing document 4_2023-07-05
2025-11-14 15:58:17,805 - IN

Converted 'data\edgar_documents\CMCSA\4_2023-06-06' --> 'data\processed_data\CMCSA\4_2023-06-06.md'
Converted 'data\edgar_documents\CMCSA\4_2023-06-14' --> 'data\processed_data\CMCSA\4_2023-06-14.md'
Converted 'data\edgar_documents\CMCSA\4_2023-06-21' --> 'data\processed_data\CMCSA\4_2023-06-21.md'
Converted 'data\edgar_documents\CMCSA\4_2023-07-05' --> 'data\processed_data\CMCSA\4_2023-07-05.md'


2025-11-14 15:58:17,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,868 - INFO - Going to convert document batch...
2025-11-14 15:58:17,870 - INFO - Processing document 4_2023-08-07
2025-11-14 15:58:17,890 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 15:58:17,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,928 - INFO - Going to convert document batch...
2025-11-14 15:58:17,929 - INFO - Processing document 4_2023-08-30
2025-11-14 15:58:17,944 - INFO - Finished converting document 4_2023-08-30 in 0.03 sec.
2025-11-14 15:58:17,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,980 - INFO - Going to convert document batch...
2025-11-14 15:58:17,980 - INFO - Processing document 4_2023-10-03
2025-11-14 15:58:17,997 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.
2025-11-14 15:58:18,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2023-08-07' --> 'data\processed_data\CMCSA\4_2023-08-07.md'
Converted 'data\edgar_documents\CMCSA\4_2023-08-30' --> 'data\processed_data\CMCSA\4_2023-08-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-10-03' --> 'data\processed_data\CMCSA\4_2023-10-03.md'
Converted 'data\edgar_documents\CMCSA\4_2023-10-05' --> 'data\processed_data\CMCSA\4_2023-10-05.md'


2025-11-14 15:58:18,104 - INFO - Going to convert document batch...
2025-11-14 15:58:18,105 - INFO - Processing document 4_2023-11-15
2025-11-14 15:58:18,124 - INFO - Finished converting document 4_2023-11-15 in 0.05 sec.
2025-11-14 15:58:18,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,172 - INFO - Going to convert document batch...
2025-11-14 15:58:18,174 - INFO - Processing document 4_2023-11-22
2025-11-14 15:58:18,202 - INFO - Finished converting document 4_2023-11-22 in 0.06 sec.
2025-11-14 15:58:18,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,244 - INFO - Going to convert document batch...
2025-11-14 15:58:18,245 - INFO - Processing document 4_2023-12-06
2025-11-14 15:58:18,278 - INFO - Finished converting document 4_2023-12-06 in 0.06 sec.
2025-11-14 15:58:18,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2023-11-15' --> 'data\processed_data\CMCSA\4_2023-11-15.md'
Converted 'data\edgar_documents\CMCSA\4_2023-11-22' --> 'data\processed_data\CMCSA\4_2023-11-22.md'
Converted 'data\edgar_documents\CMCSA\4_2023-12-06' --> 'data\processed_data\CMCSA\4_2023-12-06.md'


2025-11-14 15:58:18,327 - INFO - Processing document 4_2023-12-18
2025-11-14 15:58:18,345 - INFO - Finished converting document 4_2023-12-18 in 0.03 sec.
2025-11-14 15:58:18,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,382 - INFO - Going to convert document batch...
2025-11-14 15:58:18,383 - INFO - Processing document 4_2024-01-03
2025-11-14 15:58:18,401 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:58:18,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,437 - INFO - Going to convert document batch...
2025-11-14 15:58:18,438 - INFO - Processing document 4_2024-01-04
2025-11-14 15:58:18,454 - INFO - Finished converting document 4_2024-01-04 in 0.03 sec.
2025-11-14 15:58:18,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,494 - INFO - Going to convert document batch...
2025-11-14 15:58:18,495 - INFO - Processing document 4_2024-01-08
2025-11-14 15:58:18,513 - IN

Converted 'data\edgar_documents\CMCSA\4_2023-12-18' --> 'data\processed_data\CMCSA\4_2023-12-18.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-03' --> 'data\processed_data\CMCSA\4_2024-01-03.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-04' --> 'data\processed_data\CMCSA\4_2024-01-04.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-08' --> 'data\processed_data\CMCSA\4_2024-01-08.md'


2025-11-14 15:58:18,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,564 - INFO - Going to convert document batch...
2025-11-14 15:58:18,565 - INFO - Processing document 4_2024-01-16
2025-11-14 15:58:18,586 - INFO - Finished converting document 4_2024-01-16 in 0.05 sec.
2025-11-14 15:58:18,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,625 - INFO - Going to convert document batch...
2025-11-14 15:58:18,626 - INFO - Processing document 4_2024-01-29
2025-11-14 15:58:18,642 - INFO - Finished converting document 4_2024-01-29 in 0.03 sec.
2025-11-14 15:58:18,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,700 - INFO - Going to convert document batch...
2025-11-14 15:58:18,701 - INFO - Processing document 4_2024-01-30
2025-11-14 15:58:18,725 - INFO - Finished converting document 4_2024-01-30 in 0.06 sec.
2025-11-14 15:58:18,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2024-01-16' --> 'data\processed_data\CMCSA\4_2024-01-16.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-29' --> 'data\processed_data\CMCSA\4_2024-01-29.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-30' --> 'data\processed_data\CMCSA\4_2024-01-30.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-31' --> 'data\processed_data\CMCSA\4_2024-01-31.md'


2025-11-14 15:58:18,822 - INFO - Going to convert document batch...
2025-11-14 15:58:18,822 - INFO - Processing document 4_2024-02-16
2025-11-14 15:58:18,840 - INFO - Finished converting document 4_2024-02-16 in 0.05 sec.
2025-11-14 15:58:18,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,882 - INFO - Going to convert document batch...
2025-11-14 15:58:18,883 - INFO - Processing document 4_2024-03-05
2025-11-14 15:58:18,907 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:58:18,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,972 - INFO - Going to convert document batch...
2025-11-14 15:58:18,973 - INFO - Processing document 4_2024-03-11
2025-11-14 15:58:18,991 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.
2025-11-14 15:58:19,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,047 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2024-02-16' --> 'data\processed_data\CMCSA\4_2024-02-16.md'
Converted 'data\edgar_documents\CMCSA\4_2024-03-05' --> 'data\processed_data\CMCSA\4_2024-03-05.md'
Converted 'data\edgar_documents\CMCSA\4_2024-03-11' --> 'data\processed_data\CMCSA\4_2024-03-11.md'


2025-11-14 15:58:19,048 - INFO - Processing document 4_2024-03-19
2025-11-14 15:58:19,069 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 15:58:19,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,109 - INFO - Going to convert document batch...
2025-11-14 15:58:19,109 - INFO - Processing document 4_2024-04-01
2025-11-14 15:58:19,131 - INFO - Finished converting document 4_2024-04-01 in 0.03 sec.
2025-11-14 15:58:19,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,185 - INFO - Going to convert document batch...
2025-11-14 15:58:19,185 - INFO - Processing document 4_2024-04-02
2025-11-14 15:58:19,201 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 15:58:19,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,239 - INFO - Going to convert document batch...
2025-11-14 15:58:19,239 - INFO - Processing document 4_2024-04-17
2025-11-14 15:58:19,257 - IN

Converted 'data\edgar_documents\CMCSA\4_2024-03-19' --> 'data\processed_data\CMCSA\4_2024-03-19.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-01' --> 'data\processed_data\CMCSA\4_2024-04-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-02' --> 'data\processed_data\CMCSA\4_2024-04-02.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-17' --> 'data\processed_data\CMCSA\4_2024-04-17.md'


2025-11-14 15:58:19,293 - INFO - Going to convert document batch...
2025-11-14 15:58:19,294 - INFO - Processing document 4_2024-05-13
2025-11-14 15:58:19,312 - INFO - Finished converting document 4_2024-05-13 in 0.03 sec.
2025-11-14 15:58:19,347 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:19,348 - ERROR - Input document 4_2024-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:58:19,349 - INFO - Going to convert document batch...
2025-11-14 15:58:19,359 - IN

Converted 'data\edgar_documents\CMCSA\4_2024-05-13' --> 'data\processed_data\CMCSA\4_2024-05-13.md'
Error processing data\edgar_documents\CMCSA\4_2024-05-21: File format not allowed: data\edgar_documents\CMCSA\4_2024-05-21
Converted 'data\edgar_documents\CMCSA\4_2024-05-23' --> 'data\processed_data\CMCSA\4_2024-05-23.md'
Converted 'data\edgar_documents\CMCSA\4_2024-06-07' --> 'data\processed_data\CMCSA\4_2024-06-07.md'


2025-11-14 15:58:19,516 - INFO - Processing document 4_2024-06-20
2025-11-14 15:58:19,535 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 15:58:19,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,573 - INFO - Going to convert document batch...
2025-11-14 15:58:19,574 - INFO - Processing document 4_2024-07-01
2025-11-14 15:58:19,589 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 15:58:19,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,644 - INFO - Going to convert document batch...
2025-11-14 15:58:19,644 - INFO - Processing document 4_2024-09-18
2025-11-14 15:58:19,661 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 15:58:19,698 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:19,699 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\CMCSA\4_2024-06-20' --> 'data\processed_data\CMCSA\4_2024-06-20.md'
Converted 'data\edgar_documents\CMCSA\4_2024-07-01' --> 'data\processed_data\CMCSA\4_2024-07-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-09-18' --> 'data\processed_data\CMCSA\4_2024-09-18.md'
Error processing data\edgar_documents\CMCSA\4_2024-09-23: File format not allowed: data\edgar_documents\CMCSA\4_2024-09-23
Error processing data\edgar_documents\CMCSA\4_2024-09-25: File format not allowed: data\edgar_documents\CMCSA\4_2024-09-25


2025-11-14 15:58:19,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,739 - INFO - Going to convert document batch...
2025-11-14 15:58:19,740 - INFO - Processing document 4_2024-10-01
2025-11-14 15:58:19,778 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 15:58:19,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,821 - INFO - Going to convert document batch...
2025-11-14 15:58:19,822 - INFO - Processing document 4_2024-11-05
2025-11-14 15:58:19,839 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 15:58:19,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,906 - INFO - Going to convert document batch...
2025-11-14 15:58:19,907 - INFO - Processing document 4_2024-11-07
2025-11-14 15:58:19,929 - INFO - Finished converting document 4_2024-11-07 in 0.06 sec.
2025-11-14 15:58:19,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2024-10-01' --> 'data\processed_data\CMCSA\4_2024-10-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-05' --> 'data\processed_data\CMCSA\4_2024-11-05.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-07' --> 'data\processed_data\CMCSA\4_2024-11-07.md'


2025-11-14 15:58:20,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,020 - INFO - Going to convert document batch...
2025-11-14 15:58:20,021 - INFO - Processing document 4_2024-11-25
2025-11-14 15:58:20,038 - INFO - Finished converting document 4_2024-11-25 in 0.03 sec.
2025-11-14 15:58:20,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,096 - INFO - Going to convert document batch...
2025-11-14 15:58:20,097 - INFO - Processing document 4_2024-11-29
2025-11-14 15:58:20,115 - INFO - Finished converting document 4_2024-11-29 in 0.06 sec.
2025-11-14 15:58:20,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,151 - INFO - Going to convert document batch...
2025-11-14 15:58:20,153 - INFO - Processing document 4_2024-12-03
2025-11-14 15:58:20,170 - INFO - Finished converting document 4_2024-12-03 in 0.05 sec.
2025-11-14 15:58:20,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2024-11-22' --> 'data\processed_data\CMCSA\4_2024-11-22.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-25' --> 'data\processed_data\CMCSA\4_2024-11-25.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-29' --> 'data\processed_data\CMCSA\4_2024-11-29.md'
Converted 'data\edgar_documents\CMCSA\4_2024-12-03' --> 'data\processed_data\CMCSA\4_2024-12-03.md'


2025-11-14 15:58:20,207 - INFO - Going to convert document batch...
2025-11-14 15:58:20,209 - INFO - Processing document 4_2025-01-03
2025-11-14 15:58:20,225 - INFO - Finished converting document 4_2025-01-03 in 0.03 sec.
2025-11-14 15:58:20,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,264 - INFO - Going to convert document batch...
2025-11-14 15:58:20,264 - INFO - Processing document 4_2025-01-06
2025-11-14 15:58:20,288 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:58:20,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,329 - INFO - Going to convert document batch...
2025-11-14 15:58:20,330 - INFO - Processing document 4_2025-01-15
2025-11-14 15:58:20,349 - INFO - Finished converting document 4_2025-01-15 in 0.03 sec.
2025-11-14 15:58:20,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,404 - INFO - Going to convert document batch...
2025-11-14 15:58:20,404 - 

Converted 'data\edgar_documents\CMCSA\4_2025-01-03' --> 'data\processed_data\CMCSA\4_2025-01-03.md'
Converted 'data\edgar_documents\CMCSA\4_2025-01-06' --> 'data\processed_data\CMCSA\4_2025-01-06.md'
Converted 'data\edgar_documents\CMCSA\4_2025-01-15' --> 'data\processed_data\CMCSA\4_2025-01-15.md'


2025-11-14 15:58:20,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,463 - INFO - Going to convert document batch...
2025-11-14 15:58:20,464 - INFO - Processing document 4_2025-03-04
2025-11-14 15:58:20,485 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.
2025-11-14 15:58:20,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,525 - INFO - Going to convert document batch...
2025-11-14 15:58:20,526 - INFO - Processing document 4_2025-03-07
2025-11-14 15:58:20,546 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 15:58:20,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,585 - INFO - Going to convert document batch...
2025-11-14 15:58:20,586 - INFO - Processing document 4_2025-03-10
2025-11-14 15:58:20,602 - INFO - Finished converting document 4_2025-03-10 in 0.03 sec.
2025-11-14 15:58:20,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2025-02-27' --> 'data\processed_data\CMCSA\4_2025-02-27.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-04' --> 'data\processed_data\CMCSA\4_2025-03-04.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-07' --> 'data\processed_data\CMCSA\4_2025-03-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-10' --> 'data\processed_data\CMCSA\4_2025-03-10.md'


2025-11-14 15:58:20,636 - INFO - Going to convert document batch...
2025-11-14 15:58:20,637 - INFO - Processing document 4_2025-03-19
2025-11-14 15:58:20,654 - INFO - Finished converting document 4_2025-03-19 in 0.03 sec.
2025-11-14 15:58:20,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,694 - INFO - Going to convert document batch...
2025-11-14 15:58:20,695 - INFO - Processing document 4_2025-04-02
2025-11-14 15:58:20,712 - INFO - Finished converting document 4_2025-04-02 in 0.03 sec.
2025-11-14 15:58:20,749 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:20,750 - ERROR - Input document 4_2025-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CMCSA\4_2025-03-19' --> 'data\processed_data\CMCSA\4_2025-03-19.md'
Converted 'data\edgar_documents\CMCSA\4_2025-04-02' --> 'data\processed_data\CMCSA\4_2025-04-02.md'
Error processing data\edgar_documents\CMCSA\4_2025-05-06: File format not allowed: data\edgar_documents\CMCSA\4_2025-05-06
Converted 'data\edgar_documents\CMCSA\4_2025-05-07' --> 'data\processed_data\CMCSA\4_2025-05-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-05-15' --> 'data\processed_data\CMCSA\4_2025-05-15.md'


2025-11-14 15:58:20,881 - INFO - Going to convert document batch...
2025-11-14 15:58:20,882 - INFO - Processing document 4_2025-05-23
2025-11-14 15:58:20,901 - INFO - Finished converting document 4_2025-05-23 in 0.05 sec.
2025-11-14 15:58:20,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,941 - INFO - Going to convert document batch...
2025-11-14 15:58:20,942 - INFO - Processing document 4_2025-06-06


Converted 'data\edgar_documents\CMCSA\4_2025-05-23' --> 'data\processed_data\CMCSA\4_2025-05-23.md'


2025-11-14 15:58:21,160 - INFO - Finished converting document 4_2025-06-06 in 0.23 sec.
2025-11-14 15:58:21,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,199 - INFO - Going to convert document batch...
2025-11-14 15:58:21,199 - INFO - Processing document 4_2025-06-20
2025-11-14 15:58:21,217 - INFO - Finished converting document 4_2025-06-20 in 0.05 sec.
2025-11-14 15:58:21,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,270 - INFO - Going to convert document batch...
2025-11-14 15:58:21,271 - INFO - Processing document 4_2025-07-02
2025-11-14 15:58:21,288 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 15:58:21,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,331 - INFO - Going to convert document batch...
2025-11-14 15:58:21,331 - INFO - Processing document 4_2025-08-07
2025-11-14 15:58:21,358 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.


Converted 'data\edgar_documents\CMCSA\4_2025-06-06' --> 'data\processed_data\CMCSA\4_2025-06-06.md'
Converted 'data\edgar_documents\CMCSA\4_2025-06-20' --> 'data\processed_data\CMCSA\4_2025-06-20.md'
Converted 'data\edgar_documents\CMCSA\4_2025-07-02' --> 'data\processed_data\CMCSA\4_2025-07-02.md'


2025-11-14 15:58:21,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,404 - INFO - Going to convert document batch...
2025-11-14 15:58:21,405 - INFO - Processing document 4_2025-08-21
2025-11-14 15:58:21,422 - INFO - Finished converting document 4_2025-08-21 in 0.05 sec.
2025-11-14 15:58:21,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,457 - INFO - Going to convert document batch...
2025-11-14 15:58:21,458 - INFO - Processing document 4_2025-09-04
2025-11-14 15:58:21,475 - INFO - Finished converting document 4_2025-09-04 in 0.03 sec.
2025-11-14 15:58:21,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,512 - INFO - Going to convert document batch...
2025-11-14 15:58:21,513 - INFO - Processing document 4_2025-10-02
2025-11-14 15:58:21,530 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:58:21,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2025-08-07' --> 'data\processed_data\CMCSA\4_2025-08-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-08-21' --> 'data\processed_data\CMCSA\4_2025-08-21.md'
Converted 'data\edgar_documents\CMCSA\4_2025-09-04' --> 'data\processed_data\CMCSA\4_2025-09-04.md'
Converted 'data\edgar_documents\CMCSA\4_2025-10-02' --> 'data\processed_data\CMCSA\4_2025-10-02.md'


2025-11-14 15:58:21,567 - INFO - Going to convert document batch...
2025-11-14 15:58:21,568 - INFO - Processing document 4_2025-11-05
2025-11-14 15:58:21,604 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 15:58:21,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,664 - INFO - Going to convert document batch...
2025-11-14 15:58:21,664 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:58:21,693 - INFO - Finished converting document 8-K_2023-01-06 in 0.06 sec.
2025-11-14 15:58:21,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,741 - INFO - Going to convert document batch...
2025-11-14 15:58:21,741 - INFO - Processing document 8-K_2023-01-26
2025-11-14 15:58:21,765 - INFO - Finished converting document 8-K_2023-01-26 in 0.06 sec.
2025-11-14 15:58:21,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,810 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2025-11-05' --> 'data\processed_data\CMCSA\4_2025-11-05.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-01-06' --> 'data\processed_data\CMCSA\8-K_2023-01-06.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-01-26' --> 'data\processed_data\CMCSA\8-K_2023-01-26.md'


2025-11-14 15:58:21,811 - INFO - Processing document 8-K_2023-02-09
2025-11-14 15:58:21,834 - INFO - Finished converting document 8-K_2023-02-09 in 0.05 sec.
2025-11-14 15:58:21,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,878 - INFO - Going to convert document batch...
2025-11-14 15:58:21,879 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:58:21,904 - INFO - Finished converting document 8-K_2023-03-13 in 0.06 sec.
2025-11-14 15:58:21,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,995 - INFO - Going to convert document batch...
2025-11-14 15:58:21,995 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:58:22,018 - INFO - Finished converting document 8-K_2023-03-15 in 0.09 sec.
2025-11-14 15:58:22,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2023-02-09' --> 'data\processed_data\CMCSA\8-K_2023-02-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-03-13' --> 'data\processed_data\CMCSA\8-K_2023-03-13.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-03-15' --> 'data\processed_data\CMCSA\8-K_2023-03-15.md'


2025-11-14 15:58:22,059 - INFO - Going to convert document batch...
2025-11-14 15:58:22,060 - INFO - Processing document 8-K_2023-04-21
2025-11-14 15:58:22,079 - INFO - Finished converting document 8-K_2023-04-21 in 0.05 sec.
2025-11-14 15:58:22,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,118 - INFO - Going to convert document batch...
2025-11-14 15:58:22,118 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:58:22,138 - INFO - Finished converting document 8-K_2023-04-24 in 0.05 sec.
2025-11-14 15:58:22,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,181 - INFO - Going to convert document batch...
2025-11-14 15:58:22,181 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:58:22,205 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:58:22,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,248 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2023-04-21' --> 'data\processed_data\CMCSA\8-K_2023-04-21.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-04-24' --> 'data\processed_data\CMCSA\8-K_2023-04-24.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-04-27' --> 'data\processed_data\CMCSA\8-K_2023-04-27.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-05-01' --> 'data\processed_data\CMCSA\8-K_2023-05-01.md'


2025-11-14 15:58:22,311 - INFO - Going to convert document batch...
2025-11-14 15:58:22,311 - INFO - Processing document 8-K_2023-05-08
2025-11-14 15:58:22,335 - INFO - Finished converting document 8-K_2023-05-08 in 0.05 sec.
2025-11-14 15:58:22,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,378 - INFO - Going to convert document batch...
2025-11-14 15:58:22,378 - INFO - Processing document 8-K_2023-05-09
2025-11-14 15:58:22,405 - INFO - Finished converting document 8-K_2023-05-09 in 0.06 sec.
2025-11-14 15:58:22,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,461 - INFO - Going to convert document batch...
2025-11-14 15:58:22,462 - INFO - Processing document 8-K_2023-06-09
2025-11-14 15:58:22,524 - INFO - Finished converting document 8-K_2023-06-09 in 0.09 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2023-05-08' --> 'data\processed_data\CMCSA\8-K_2023-05-08.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-05-09' --> 'data\processed_data\CMCSA\8-K_2023-05-09.md'


2025-11-14 15:58:22,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,587 - INFO - Going to convert document batch...
2025-11-14 15:58:22,588 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:58:22,613 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.
2025-11-14 15:58:22,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,657 - INFO - Going to convert document batch...
2025-11-14 15:58:22,658 - INFO - Processing document 8-K_2023-09-11
2025-11-14 15:58:22,681 - INFO - Finished converting document 8-K_2023-09-11 in 0.05 sec.
2025-11-14 15:58:22,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2023-06-09' --> 'data\processed_data\CMCSA\8-K_2023-06-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-07-27' --> 'data\processed_data\CMCSA\8-K_2023-07-27.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-09-11' --> 'data\processed_data\CMCSA\8-K_2023-09-11.md'


2025-11-14 15:58:22,755 - INFO - Going to convert document batch...
2025-11-14 15:58:22,756 - INFO - Processing document 8-K_2023-10-03
2025-11-14 15:58:22,780 - INFO - Finished converting document 8-K_2023-10-03 in 0.08 sec.
2025-11-14 15:58:22,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,827 - INFO - Going to convert document batch...
2025-11-14 15:58:22,828 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:58:22,851 - INFO - Finished converting document 8-K_2023-10-26 in 0.05 sec.
2025-11-14 15:58:22,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,896 - INFO - Going to convert document batch...
2025-11-14 15:58:22,896 - INFO - Processing document 8-K_2023-12-06
2025-11-14 15:58:22,921 - INFO - Finished converting document 8-K_2023-12-06 in 0.06 sec.
2025-11-14 15:58:22,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,993 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\8-K_2023-10-03' --> 'data\processed_data\CMCSA\8-K_2023-10-03.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-10-26' --> 'data\processed_data\CMCSA\8-K_2023-10-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-12-06' --> 'data\processed_data\CMCSA\8-K_2023-12-06.md'


2025-11-14 15:58:22,994 - INFO - Processing document 8-K_2024-01-25
2025-11-14 15:58:23,028 - INFO - Finished converting document 8-K_2024-01-25 in 0.09 sec.
2025-11-14 15:58:23,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,090 - INFO - Going to convert document batch...
2025-11-14 15:58:23,091 - INFO - Processing document 8-K_2024-04-15
2025-11-14 15:58:23,112 - INFO - Finished converting document 8-K_2024-04-15 in 0.05 sec.
2025-11-14 15:58:23,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,155 - INFO - Going to convert document batch...
2025-11-14 15:58:23,157 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:58:23,181 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 15:58:23,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,226 - INFO - Going to convert document batch...
2025-11-14 15:58:23,227 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2024-01-25' --> 'data\processed_data\CMCSA\8-K_2024-01-25.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-04-15' --> 'data\processed_data\CMCSA\8-K_2024-04-15.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-04-25' --> 'data\processed_data\CMCSA\8-K_2024-04-25.md'


2025-11-14 15:58:23,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,300 - INFO - Going to convert document batch...
2025-11-14 15:58:23,301 - INFO - Processing document 8-K_2024-05-22
2025-11-14 15:58:23,323 - INFO - Finished converting document 8-K_2024-05-22 in 0.06 sec.
2025-11-14 15:58:23,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,396 - INFO - Going to convert document batch...
2025-11-14 15:58:23,397 - INFO - Processing document 8-K_2024-06-12
2025-11-14 15:58:23,434 - INFO - Finished converting document 8-K_2024-06-12 in 0.11 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2024-05-17' --> 'data\processed_data\CMCSA\8-K_2024-05-17.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-05-22' --> 'data\processed_data\CMCSA\8-K_2024-05-22.md'


2025-11-14 15:58:23,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,480 - INFO - Going to convert document batch...
2025-11-14 15:58:23,481 - INFO - Processing document 8-K_2024-07-23
2025-11-14 15:58:23,507 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 15:58:23,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,566 - INFO - Going to convert document batch...
2025-11-14 15:58:23,567 - INFO - Processing document 8-K_2024-09-23
2025-11-14 15:58:23,583 - INFO - Finished converting document 8-K_2024-09-23 in 0.06 sec.
2025-11-14 15:58:23,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,618 - INFO - Going to convert document batch...
2025-11-14 15:58:23,618 - INFO - Processing document 8-K_2024-09-26
2025-11-14 15:58:23,638 - INFO - Finished converting document 8-K_2024-09-26 in 0.05 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2024-06-12' --> 'data\processed_data\CMCSA\8-K_2024-06-12.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-07-23' --> 'data\processed_data\CMCSA\8-K_2024-07-23.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-09-23' --> 'data\processed_data\CMCSA\8-K_2024-09-23.md'


2025-11-14 15:58:23,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,679 - INFO - Going to convert document batch...
2025-11-14 15:58:23,679 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:58:23,705 - INFO - Finished converting document 8-K_2024-10-31 in 0.06 sec.
2025-11-14 15:58:23,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,750 - INFO - Going to convert document batch...
2025-11-14 15:58:23,750 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:58:23,774 - INFO - Finished converting document 8-K_2025-01-30 in 0.05 sec.
2025-11-14 15:58:23,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,819 - INFO - Going to convert document batch...
2025-11-14 15:58:23,820 - INFO - Processing document 8-K_2025-03-19


Converted 'data\edgar_documents\CMCSA\8-K_2024-09-26' --> 'data\processed_data\CMCSA\8-K_2024-09-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-10-31' --> 'data\processed_data\CMCSA\8-K_2024-10-31.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-01-30' --> 'data\processed_data\CMCSA\8-K_2025-01-30.md'


2025-11-14 15:58:24,046 - INFO - Finished converting document 8-K_2025-03-19 in 0.25 sec.
2025-11-14 15:58:24,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,088 - INFO - Going to convert document batch...
2025-11-14 15:58:24,089 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:58:24,114 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 15:58:24,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,157 - INFO - Going to convert document batch...
2025-11-14 15:58:24,158 - INFO - Processing document 8-K_2025-05-05
2025-11-14 15:58:24,177 - INFO - Finished converting document 8-K_2025-05-05 in 0.05 sec.
2025-11-14 15:58:24,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,210 - INFO - Going to convert document batch...
2025-11-14 15:58:24,211 - INFO - Processing document 8-K_2025-05-08
2025-11-14 15:58:24,232 - INFO - Finished converting document 8-K_2025-05-08 in 0.

Converted 'data\edgar_documents\CMCSA\8-K_2025-03-19' --> 'data\processed_data\CMCSA\8-K_2025-03-19.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-04-24' --> 'data\processed_data\CMCSA\8-K_2025-04-24.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-05-05' --> 'data\processed_data\CMCSA\8-K_2025-05-05.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-05-08' --> 'data\processed_data\CMCSA\8-K_2025-05-08.md'


2025-11-14 15:58:24,280 - INFO - Going to convert document batch...
2025-11-14 15:58:24,280 - INFO - Processing document 8-K_2025-06-20
2025-11-14 15:58:24,323 - INFO - Finished converting document 8-K_2025-06-20 in 0.09 sec.
2025-11-14 15:58:24,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,374 - INFO - Going to convert document batch...
2025-11-14 15:58:24,374 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:58:24,400 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 15:58:24,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,449 - INFO - Going to convert document batch...
2025-11-14 15:58:24,450 - INFO - Processing document 8-K_2025-08-22
2025-11-14 15:58:24,474 - INFO - Finished converting document 8-K_2025-08-22 in 0.05 sec.
2025-11-14 15:58:24,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,514 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2025-06-20' --> 'data\processed_data\CMCSA\8-K_2025-06-20.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-07-31' --> 'data\processed_data\CMCSA\8-K_2025-07-31.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-08-22' --> 'data\processed_data\CMCSA\8-K_2025-08-22.md'


2025-11-14 15:58:24,539 - INFO - Finished converting document 8-K_2025-09-22 in 0.05 sec.
2025-11-14 15:58:24,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,610 - INFO - Going to convert document batch...
2025-11-14 15:58:24,612 - INFO - Processing document 8-K_2025-09-26
2025-11-14 15:58:24,641 - INFO - Finished converting document 8-K_2025-09-26 in 0.09 sec.
2025-11-14 15:58:24,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,682 - INFO - Going to convert document batch...
2025-11-14 15:58:24,682 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:58:24,705 - INFO - Finished converting document 8-K_2025-09-29 in 0.05 sec.
2025-11-14 15:58:24,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2025-09-22' --> 'data\processed_data\CMCSA\8-K_2025-09-22.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-09-26' --> 'data\processed_data\CMCSA\8-K_2025-09-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-09-29' --> 'data\processed_data\CMCSA\8-K_2025-09-29.md'


2025-11-14 15:58:24,749 - INFO - Going to convert document batch...
2025-11-14 15:58:24,751 - INFO - Processing document 8-K_2025-10-01
2025-11-14 15:58:24,777 - INFO - Finished converting document 8-K_2025-10-01 in 0.06 sec.
2025-11-14 15:58:24,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,847 - INFO - Going to convert document batch...
2025-11-14 15:58:24,848 - INFO - Processing document 8-K_2025-10-02
2025-11-14 15:58:24,875 - INFO - Finished converting document 8-K_2025-10-02 in 0.08 sec.
2025-11-14 15:58:24,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,946 - INFO - Going to convert document batch...
2025-11-14 15:58:24,947 - INFO - Processing document 8-K_2025-10-06
2025-11-14 15:58:24,971 - INFO - Finished converting document 8-K_2025-10-06 in 0.08 sec.
2025-11-14 15:58:24,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2025-10-01' --> 'data\processed_data\CMCSA\8-K_2025-10-01.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-02' --> 'data\processed_data\CMCSA\8-K_2025-10-02.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-06' --> 'data\processed_data\CMCSA\8-K_2025-10-06.md'


2025-11-14 15:58:25,013 - INFO - Going to convert document batch...
2025-11-14 15:58:25,014 - INFO - Processing document 8-K_2025-10-08
2025-11-14 15:58:25,039 - INFO - Finished converting document 8-K_2025-10-08 in 0.05 sec.
2025-11-14 15:58:25,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,083 - INFO - Going to convert document batch...
2025-11-14 15:58:25,083 - INFO - Processing document 8-K_2025-10-09
2025-11-14 15:58:25,112 - INFO - Finished converting document 8-K_2025-10-09 in 0.06 sec.
2025-11-14 15:58:25,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,180 - INFO - Going to convert document batch...
2025-11-14 15:58:25,181 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:58:25,205 - INFO - Finished converting document 8-K_2025-10-30 in 0.08 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2025-10-08' --> 'data\processed_data\CMCSA\8-K_2025-10-08.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-09' --> 'data\processed_data\CMCSA\8-K_2025-10-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-30' --> 'data\processed_data\CMCSA\8-K_2025-10-30.md'


2025-11-14 15:58:25,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,872 - INFO - Going to convert document batch...
2025-11-14 15:58:25,874 - INFO - Processing document DEF-14A_2023-04-28
2025-11-14 15:58:32,164 - INFO - Finished converting document DEF-14A_2023-04-28 in 6.94 sec.
2025-11-14 15:58:33,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2023-04-28' --> 'data\processed_data\CMCSA\DEF-14A_2023-04-28.md'


2025-11-14 15:58:33,678 - INFO - Going to convert document batch...
2025-11-14 15:58:33,679 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 15:58:38,579 - INFO - Finished converting document DEF-14A_2024-04-26 in 5.50 sec.
2025-11-14 15:58:39,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2024-04-26' --> 'data\processed_data\CMCSA\DEF-14A_2024-04-26.md'


2025-11-14 15:58:39,683 - INFO - Going to convert document batch...
2025-11-14 15:58:39,683 - INFO - Processing document DEF-14A_2025-04-25
2025-11-14 15:58:46,691 - INFO - Finished converting document DEF-14A_2025-04-25 in 7.45 sec.
2025-11-14 15:58:47,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2025-04-25' --> 'data\processed_data\CMCSA\DEF-14A_2025-04-25.md'
Processed 134 new files. Errors: 7
Found 186 files to process in data\edgar_documents\COF


2025-11-14 15:58:49,953 - INFO - Going to convert document batch...
2025-11-14 15:58:49,953 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:58:49,954 - INFO - Processing document 10-K_2023-02-24
2025-11-14 15:59:04,935 - INFO - Finished converting document 10-K_2023-02-24 in 17.34 sec.


Converted 'data\edgar_documents\COF\10-K_2023-02-24' --> 'data\processed_data\COF\10-K_2023-02-24.md'


2025-11-14 15:59:09,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:59:15,242 - INFO - Going to convert document batch...
2025-11-14 15:59:15,244 - INFO - Processing document 10-K_2024-02-23
2025-11-14 15:59:30,339 - INFO - Finished converting document 10-K_2024-02-23 in 20.84 sec.


Converted 'data\edgar_documents\COF\10-K_2024-02-23' --> 'data\processed_data\COF\10-K_2024-02-23.md'


2025-11-14 15:59:34,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:59:39,181 - INFO - Going to convert document batch...
2025-11-14 15:59:39,182 - INFO - Processing document 10-K_2025-02-20
2025-11-14 15:59:55,743 - INFO - Finished converting document 10-K_2025-02-20 in 20.95 sec.
2025-11-14 16:00:01,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-K_2025-02-20' --> 'data\processed_data\COF\10-K_2025-02-20.md'


2025-11-14 16:00:07,347 - INFO - Going to convert document batch...
2025-11-14 16:00:07,348 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 16:00:17,523 - INFO - Finished converting document 10-Q_2023-05-05 in 16.62 sec.
2025-11-14 16:00:21,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-05-05' --> 'data\processed_data\COF\10-Q_2023-05-05.md'


2025-11-14 16:00:23,836 - INFO - Going to convert document batch...
2025-11-14 16:00:23,837 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 16:00:29,023 - INFO - Finished converting document 10-Q_2023-07-27 in 7.80 sec.
2025-11-14 16:00:31,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-07-27' --> 'data\processed_data\COF\10-Q_2023-07-27.md'


2025-11-14 16:00:33,840 - INFO - Going to convert document batch...
2025-11-14 16:00:33,841 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:00:38,662 - INFO - Finished converting document 10-Q_2023-11-02 in 7.80 sec.
2025-11-14 16:00:40,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-11-02' --> 'data\processed_data\COF\10-Q_2023-11-02.md'


2025-11-14 16:00:42,976 - INFO - Going to convert document batch...
2025-11-14 16:00:42,977 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:00:49,911 - INFO - Finished converting document 10-Q_2024-05-02 in 9.34 sec.


Converted 'data\edgar_documents\COF\10-Q_2024-05-02' --> 'data\processed_data\COF\10-Q_2024-05-02.md'


2025-11-14 16:00:54,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:01:02,359 - INFO - Going to convert document batch...
2025-11-14 16:01:02,360 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 16:01:17,373 - INFO - Finished converting document 10-Q_2024-08-01 in 23.03 sec.


Converted 'data\edgar_documents\COF\10-Q_2024-08-01' --> 'data\processed_data\COF\10-Q_2024-08-01.md'


2025-11-14 16:01:22,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:01:30,995 - INFO - Going to convert document batch...
2025-11-14 16:01:30,998 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 16:01:44,426 - INFO - Finished converting document 10-Q_2024-10-31 in 21.97 sec.
2025-11-14 16:01:49,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2024-10-31' --> 'data\processed_data\COF\10-Q_2024-10-31.md'


2025-11-14 16:01:55,396 - INFO - Going to convert document batch...
2025-11-14 16:01:55,397 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 16:01:59,481 - INFO - Finished converting document 10-Q_2025-05-07 in 9.89 sec.
2025-11-14 16:02:02,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2025-05-07' --> 'data\processed_data\COF\10-Q_2025-05-07.md'


2025-11-14 16:02:04,860 - INFO - Going to convert document batch...
2025-11-14 16:02:04,861 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 16:02:13,233 - INFO - Finished converting document 10-Q_2025-07-31 in 10.98 sec.


Converted 'data\edgar_documents\COF\10-Q_2025-07-31' --> 'data\processed_data\COF\10-Q_2025-07-31.md'


2025-11-14 16:02:19,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:27,768 - INFO - Going to convert document batch...
2025-11-14 16:02:27,769 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 16:02:44,022 - INFO - Finished converting document 10-Q_2025-11-03 in 24.50 sec.
2025-11-14 16:02:52,601 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:52,602 - ERROR - Input document 4_2023-01-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-1

Converted 'data\edgar_documents\COF\10-Q_2025-11-03' --> 'data\processed_data\COF\10-Q_2025-11-03.md'
Error processing data\edgar_documents\COF\4_2023-01-25: File format not allowed: data\edgar_documents\COF\4_2023-01-25
Error processing data\edgar_documents\COF\4_2023-01-26: File format not allowed: data\edgar_documents\COF\4_2023-01-26


2025-11-14 16:02:52,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:52,827 - INFO - Going to convert document batch...
2025-11-14 16:02:52,829 - INFO - Processing document 4_2023-02-02
2025-11-14 16:02:52,869 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.
2025-11-14 16:02:52,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:52,936 - INFO - Going to convert document batch...
2025-11-14 16:02:52,936 - INFO - Processing document 4_2023-02-16
2025-11-14 16:02:52,966 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2023-01-30' --> 'data\processed_data\COF\4_2023-01-30.md'
Converted 'data\edgar_documents\COF\4_2023-02-02' --> 'data\processed_data\COF\4_2023-02-02.md'


2025-11-14 16:02:53,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,066 - INFO - Going to convert document batch...
2025-11-14 16:02:53,068 - INFO - Processing document 4_2023-02-17
2025-11-14 16:02:53,126 - INFO - Finished converting document 4_2023-02-17 in 0.11 sec.
2025-11-14 16:02:53,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,194 - INFO - Going to convert document batch...
2025-11-14 16:02:53,196 - INFO - Processing document 4_2023-03-03


Converted 'data\edgar_documents\COF\4_2023-02-16' --> 'data\processed_data\COF\4_2023-02-16.md'
Converted 'data\edgar_documents\COF\4_2023-02-17' --> 'data\processed_data\COF\4_2023-02-17.md'


2025-11-14 16:02:53,232 - INFO - Finished converting document 4_2023-03-03 in 0.08 sec.
2025-11-14 16:02:53,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,297 - INFO - Going to convert document batch...
2025-11-14 16:02:53,299 - INFO - Processing document 4_2023-05-08
2025-11-14 16:02:53,337 - INFO - Finished converting document 4_2023-05-08 in 0.06 sec.
2025-11-14 16:02:53,409 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:53,410 - ERROR - Input document 4_2023-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\COF\4_2023-03-03' --> 'data\processed_data\COF\4_2023-03-03.md'
Converted 'data\edgar_documents\COF\4_2023-05-08' --> 'data\processed_data\COF\4_2023-05-08.md'
Error processing data\edgar_documents\COF\4_2023-06-05: File format not allowed: data\edgar_documents\COF\4_2023-06-05
Error processing data\edgar_documents\COF\4_2023-06-06: File format not allowed: data\edgar_documents\COF\4_2023-06-06


2025-11-14 16:02:53,465 - INFO - Going to convert document batch...
2025-11-14 16:02:53,466 - INFO - Processing document 4_2023-07-20
2025-11-14 16:02:53,511 - INFO - Finished converting document 4_2023-07-20 in 0.08 sec.
2025-11-14 16:02:53,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,604 - INFO - Going to convert document batch...
2025-11-14 16:02:53,605 - INFO - Processing document 4_2023-07-26
2025-11-14 16:02:53,648 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 16:02:53,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,755 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-07-20' --> 'data\processed_data\COF\4_2023-07-20.md'
Converted 'data\edgar_documents\COF\4_2023-07-26' --> 'data\processed_data\COF\4_2023-07-26.md'


2025-11-14 16:02:53,756 - INFO - Processing document 4_2023-07-27
2025-11-14 16:02:53,795 - INFO - Finished converting document 4_2023-07-27 in 0.09 sec.
2025-11-14 16:02:53,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,874 - INFO - Going to convert document batch...
2025-11-14 16:02:53,875 - INFO - Processing document 4_2023-07-28
2025-11-14 16:02:53,937 - INFO - Finished converting document 4_2023-07-28 in 0.11 sec.
2025-11-14 16:02:54,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,029 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-07-27' --> 'data\processed_data\COF\4_2023-07-27.md'
Converted 'data\edgar_documents\COF\4_2023-07-28' --> 'data\processed_data\COF\4_2023-07-28.md'


2025-11-14 16:02:54,030 - INFO - Processing document 4_2023-08-01
2025-11-14 16:02:54,079 - INFO - Finished converting document 4_2023-08-01 in 0.09 sec.
2025-11-14 16:02:54,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,164 - INFO - Going to convert document batch...
2025-11-14 16:02:54,165 - INFO - Processing document 4_2023-08-03
2025-11-14 16:02:54,215 - INFO - Finished converting document 4_2023-08-03 in 0.09 sec.
2025-11-14 16:02:54,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-08-01' --> 'data\processed_data\COF\4_2023-08-01.md'
Converted 'data\edgar_documents\COF\4_2023-08-03' --> 'data\processed_data\COF\4_2023-08-03.md'


2025-11-14 16:02:54,328 - INFO - Processing document 4_2023-08-04
2025-11-14 16:02:54,372 - INFO - Finished converting document 4_2023-08-04 in 0.11 sec.
2025-11-14 16:02:54,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,455 - INFO - Going to convert document batch...
2025-11-14 16:02:54,456 - INFO - Processing document 4_2023-08-08
2025-11-14 16:02:54,507 - INFO - Finished converting document 4_2023-08-08 in 0.09 sec.
2025-11-14 16:02:54,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2023-08-04' --> 'data\processed_data\COF\4_2023-08-04.md'
Converted 'data\edgar_documents\COF\4_2023-08-08' --> 'data\processed_data\COF\4_2023-08-08.md'


2025-11-14 16:02:54,636 - INFO - Going to convert document batch...
2025-11-14 16:02:54,639 - INFO - Processing document 4_2023-08-11
2025-11-14 16:02:54,719 - INFO - Finished converting document 4_2023-08-11 in 0.16 sec.
2025-11-14 16:02:54,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,808 - INFO - Going to convert document batch...
2025-11-14 16:02:54,809 - INFO - Processing document 4_2023-08-15
2025-11-14 16:02:54,847 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 16:02:54,911 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:54,911 - ERROR - Input document 4_2023-10-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\COF\4_2023-08-11' --> 'data\processed_data\COF\4_2023-08-11.md'
Converted 'data\edgar_documents\COF\4_2023-08-15' --> 'data\processed_data\COF\4_2023-08-15.md'
Error processing data\edgar_documents\COF\4_2023-10-27: File format not allowed: data\edgar_documents\COF\4_2023-10-27
Error processing data\edgar_documents\COF\4_2023-10-30: File format not allowed: data\edgar_documents\COF\4_2023-10-30


2025-11-14 16:02:54,973 - INFO - Going to convert document batch...
2025-11-14 16:02:54,974 - INFO - Processing document 4_2023-11-01
2025-11-14 16:02:55,055 - INFO - Finished converting document 4_2023-11-01 in 0.11 sec.
2025-11-14 16:02:55,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,165 - INFO - Going to convert document batch...
2025-11-14 16:02:55,166 - INFO - Processing document 4_2023-11-03
2025-11-14 16:02:55,277 - INFO - Finished converting document 4_2023-11-03 in 0.17 sec.


Converted 'data\edgar_documents\COF\4_2023-11-01' --> 'data\processed_data\COF\4_2023-11-01.md'


2025-11-14 16:02:55,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,422 - INFO - Going to convert document batch...
2025-11-14 16:02:55,423 - INFO - Processing document 4_2023-11-07
2025-11-14 16:02:55,512 - INFO - Finished converting document 4_2023-11-07 in 0.16 sec.


Converted 'data\edgar_documents\COF\4_2023-11-03' --> 'data\processed_data\COF\4_2023-11-03.md'


2025-11-14 16:02:55,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,614 - INFO - Going to convert document batch...
2025-11-14 16:02:55,615 - INFO - Processing document 4_2023-11-09
2025-11-14 16:02:55,676 - INFO - Finished converting document 4_2023-11-09 in 0.09 sec.
2025-11-14 16:02:55,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2023-11-07' --> 'data\processed_data\COF\4_2023-11-07.md'
Converted 'data\edgar_documents\COF\4_2023-11-09' --> 'data\processed_data\COF\4_2023-11-09.md'


2025-11-14 16:02:55,812 - INFO - Going to convert document batch...
2025-11-14 16:02:55,813 - INFO - Processing document 4_2023-11-14
2025-11-14 16:02:55,870 - INFO - Finished converting document 4_2023-11-14 in 0.14 sec.
2025-11-14 16:02:55,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,957 - INFO - Going to convert document batch...
2025-11-14 16:02:55,958 - INFO - Processing document 4_2023-11-17
2025-11-14 16:02:55,996 - INFO - Finished converting document 4_2023-11-17 in 0.08 sec.
2025-11-14 16:02:56,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,084 - INFO - Going to convert document batch...
2025-11-14 16:02:56,086 - INFO - Processing document 4_2023-12-14
2025-11-14 16:02:56,127 - INFO - Finished converting document 4_2023-12-14 in 0.09 sec.


Converted 'data\edgar_documents\COF\4_2023-11-14' --> 'data\processed_data\COF\4_2023-11-14.md'
Converted 'data\edgar_documents\COF\4_2023-11-17' --> 'data\processed_data\COF\4_2023-11-17.md'


2025-11-14 16:02:56,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,224 - INFO - Going to convert document batch...
2025-11-14 16:02:56,226 - INFO - Processing document 4_2023-12-18
2025-11-14 16:02:56,294 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2023-12-14' --> 'data\processed_data\COF\4_2023-12-14.md'
Converted 'data\edgar_documents\COF\4_2023-12-18' --> 'data\processed_data\COF\4_2023-12-18.md'


2025-11-14 16:02:56,383 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,384 - ERROR - Input document 4_2024-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:56,388 - INFO - Going to convert document batch...
2025-11-14 16:02:56,419 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,422 - ERROR - Input document 4_2024-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2024-01-29: File format not allowed: data\edgar_documents\COF\4_2024-01-29
Error processing data\edgar_documents\COF\4_2024-01-30: File format not allowed: data\edgar_documents\COF\4_2024-01-30


2025-11-14 16:02:56,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,645 - INFO - Going to convert document batch...
2025-11-14 16:02:56,647 - INFO - Processing document 4_2024-02-05
2025-11-14 16:02:56,692 - INFO - Finished converting document 4_2024-02-05 in 0.09 sec.
2025-11-14 16:02:56,760 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,761 - ERROR - Input document 4_2024-02-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02

Converted 'data\edgar_documents\COF\4_2024-02-02' --> 'data\processed_data\COF\4_2024-02-02.md'
Converted 'data\edgar_documents\COF\4_2024-02-05' --> 'data\processed_data\COF\4_2024-02-05.md'
Error processing data\edgar_documents\COF\4_2024-02-20: File format not allowed: data\edgar_documents\COF\4_2024-02-20


2025-11-14 16:02:56,793 - ERROR - Input document 4_2024-02-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:56,795 - INFO - Going to convert document batch...
2025-11-14 16:02:56,813 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,815 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\COF\4_2024-02-22: File format not allowed: data\edgar_documents\COF\4_2024-02-22
Error processing data\edgar_documents\COF\4_2024-02-27: File format not allowed: data\edgar_documents\COF\4_2024-02-27
Error processing data\edgar_documents\COF\4_2024-03-06: File format not allowed: data\edgar_documents\COF\4_2024-03-06
Error processing data\edgar_documents\COF\4_2024-03-11: File format not allowed: data\edgar_documents\COF\4_2024-03-11


2025-11-14 16:02:57,079 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,082 - ERROR - Input document 4_2024-03-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:57,085 - INFO - Going to convert document batch...
2025-11-14 16:02:57,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,135 - INFO - Going to convert document batch...
2025-11-14 16:02:57,138 - INFO - Processing document 4_2024-04-03
2025-11-14 16:02:57,210 - INFO - Fin

Converted 'data\edgar_documents\COF\4_2024-03-13' --> 'data\processed_data\COF\4_2024-03-13.md'
Error processing data\edgar_documents\COF\4_2024-03-21: File format not allowed: data\edgar_documents\COF\4_2024-03-21
Converted 'data\edgar_documents\COF\4_2024-04-03' --> 'data\processed_data\COF\4_2024-04-03.md'


2025-11-14 16:02:57,275 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,276 - ERROR - Input document 4_2024-04-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:57,277 - INFO - Going to convert document batch...
2025-11-14 16:02:57,294 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,295 - ERROR - Input document 4_2024-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2024-04-22: File format not allowed: data\edgar_documents\COF\4_2024-04-22
Error processing data\edgar_documents\COF\4_2024-04-26: File format not allowed: data\edgar_documents\COF\4_2024-04-26
Converted 'data\edgar_documents\COF\4_2024-05-02' --> 'data\processed_data\COF\4_2024-05-02.md'


2025-11-14 16:02:57,475 - INFO - Processing document 4_2024-05-03
2025-11-14 16:02:57,534 - INFO - Finished converting document 4_2024-05-03 in 0.11 sec.
2025-11-14 16:02:57,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,607 - INFO - Going to convert document batch...
2025-11-14 16:02:57,609 - INFO - Processing document 4_2024-05-06
2025-11-14 16:02:57,687 - INFO - Finished converting document 4_2024-05-06 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2024-05-03' --> 'data\processed_data\COF\4_2024-05-03.md'


2025-11-14 16:02:57,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,805 - INFO - Going to convert document batch...
2025-11-14 16:02:57,806 - INFO - Processing document 4_2024-05-09
2025-11-14 16:02:57,844 - INFO - Finished converting document 4_2024-05-09 in 0.09 sec.
2025-11-14 16:02:57,908 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,908 - ERROR - Input document 4_2024-07-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02

Converted 'data\edgar_documents\COF\4_2024-05-06' --> 'data\processed_data\COF\4_2024-05-06.md'
Converted 'data\edgar_documents\COF\4_2024-05-09' --> 'data\processed_data\COF\4_2024-05-09.md'
Error processing data\edgar_documents\COF\4_2024-07-17: File format not allowed: data\edgar_documents\COF\4_2024-07-17


2025-11-14 16:02:57,953 - INFO - Processing document 4_2024-07-19
2025-11-14 16:02:58,003 - INFO - Finished converting document 4_2024-07-19 in 0.09 sec.
2025-11-14 16:02:58,089 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:58,091 - ERROR - Input document 4_2024-07-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:58,093 - INFO - Going to convert document batch...
2025-11-14 16:02:58,125 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\COF\4_2024-07-19' --> 'data\processed_data\COF\4_2024-07-19.md'
Error processing data\edgar_documents\COF\4_2024-07-24: File format not allowed: data\edgar_documents\COF\4_2024-07-24
Error processing data\edgar_documents\COF\4_2024-07-25: File format not allowed: data\edgar_documents\COF\4_2024-07-25


2025-11-14 16:02:58,269 - INFO - Finished converting document 4_2024-08-06 in 0.14 sec.
2025-11-14 16:02:58,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,397 - INFO - Going to convert document batch...
2025-11-14 16:02:58,399 - INFO - Processing document 4_2024-08-08
2025-11-14 16:02:58,496 - INFO - Finished converting document 4_2024-08-08 in 0.16 sec.


Converted 'data\edgar_documents\COF\4_2024-08-06' --> 'data\processed_data\COF\4_2024-08-06.md'


2025-11-14 16:02:58,582 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:58,583 - ERROR - Input document 4_2024-09-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:58,585 - INFO - Going to convert document batch...
2025-11-14 16:02:58,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,620 - INFO - Going to convert document batch...
2025-11-14 16:02:58,621 - INFO - Processing document 4_2024-10-21
2025-11-14 16:02:58,662 - INFO - Fin

Converted 'data\edgar_documents\COF\4_2024-08-08' --> 'data\processed_data\COF\4_2024-08-08.md'
Error processing data\edgar_documents\COF\4_2024-09-13: File format not allowed: data\edgar_documents\COF\4_2024-09-13
Converted 'data\edgar_documents\COF\4_2024-10-21' --> 'data\processed_data\COF\4_2024-10-21.md'
Error processing data\edgar_documents\COF\4_2024-10-25: File format not allowed: data\edgar_documents\COF\4_2024-10-25


2025-11-14 16:02:58,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,773 - INFO - Going to convert document batch...
2025-11-14 16:02:58,774 - INFO - Processing document 4_2024-11-07
2025-11-14 16:02:58,812 - INFO - Finished converting document 4_2024-11-07 in 0.08 sec.
2025-11-14 16:02:58,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,880 - INFO - Going to convert document batch...
2025-11-14 16:02:58,881 - INFO - Processing document 4_2024-11-12
2025-11-14 16:02:58,922 - INFO - Finished converting document 4_2024-11-12 in 0.08 sec.
2025-11-14 16:02:58,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,010 - INFO - Going to convert document batch...
2025-11-14 16:02:59,012 - INFO - Processing document 4_2024-11-13


Converted 'data\edgar_documents\COF\4_2024-11-07' --> 'data\processed_data\COF\4_2024-11-07.md'
Converted 'data\edgar_documents\COF\4_2024-11-12' --> 'data\processed_data\COF\4_2024-11-12.md'


2025-11-14 16:02:59,050 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 16:02:59,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,141 - INFO - Going to convert document batch...
2025-11-14 16:02:59,143 - INFO - Processing document 4_2024-11-14
2025-11-14 16:02:59,213 - INFO - Finished converting document 4_2024-11-14 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2024-11-13' --> 'data\processed_data\COF\4_2024-11-13.md'


2025-11-14 16:02:59,310 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,312 - ERROR - Input document 4_2024-12-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:59,317 - INFO - Going to convert document batch...
2025-11-14 16:02:59,341 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,344 - ERROR - Input document 4_2024-12-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\COF\4_2024-11-14' --> 'data\processed_data\COF\4_2024-11-14.md'
Error processing data\edgar_documents\COF\4_2024-12-17: File format not allowed: data\edgar_documents\COF\4_2024-12-17
Error processing data\edgar_documents\COF\4_2024-12-19: File format not allowed: data\edgar_documents\COF\4_2024-12-19
Error processing data\edgar_documents\COF\4_2025-01-06: File format not allowed: data\edgar_documents\COF\4_2025-01-06
Error processing data\edgar_documents\COF\4_2025-01-23: File format not allowed: data\edgar_documents\COF\4_2025-01-23


2025-11-14 16:02:59,578 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,579 - ERROR - Input document 4_2025-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:59,586 - INFO - Going to convert document batch...
2025-11-14 16:02:59,614 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,615 - ERROR - Input document 4_2025-01-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2025-01-24: File format not allowed: data\edgar_documents\COF\4_2025-01-24
Error processing data\edgar_documents\COF\4_2025-01-28: File format not allowed: data\edgar_documents\COF\4_2025-01-28
Error processing data\edgar_documents\COF\4_2025-01-29: File format not allowed: data\edgar_documents\COF\4_2025-01-29


2025-11-14 16:02:59,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,869 - INFO - Going to convert document batch...
2025-11-14 16:02:59,871 - INFO - Processing document 4_2025-02-06
2025-11-14 16:02:59,936 - INFO - Finished converting document 4_2025-02-06 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2025-02-04' --> 'data\processed_data\COF\4_2025-02-04.md'
Converted 'data\edgar_documents\COF\4_2025-02-06' --> 'data\processed_data\COF\4_2025-02-06.md'


2025-11-14 16:03:00,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,066 - INFO - Going to convert document batch...
2025-11-14 16:03:00,071 - INFO - Processing document 4_2025-02-10
2025-11-14 16:03:00,127 - INFO - Finished converting document 4_2025-02-10 in 0.14 sec.
2025-11-14 16:03:00,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,197 - INFO - Going to convert document batch...
2025-11-14 16:03:00,199 - INFO - Processing document 4_2025-02-19
2025-11-14 16:03:00,239 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 16:03:00,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,349 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2025-02-10' --> 'data\processed_data\COF\4_2025-02-10.md'
Converted 'data\edgar_documents\COF\4_2025-02-19' --> 'data\processed_data\COF\4_2025-02-19.md'


2025-11-14 16:03:00,351 - INFO - Processing document 4_2025-03-12
2025-11-14 16:03:00,403 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.
2025-11-14 16:03:00,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,484 - INFO - Going to convert document batch...
2025-11-14 16:03:00,486 - INFO - Processing document 4_2025-05-12
2025-11-14 16:03:00,522 - INFO - Finished converting document 4_2025-05-12 in 0.06 sec.
2025-11-14 16:03:00,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,604 - INFO - Going to convert document batch...
2025-11-14 16:03:00,605 - INFO - Processing document 4_2025-05-14


Converted 'data\edgar_documents\COF\4_2025-03-12' --> 'data\processed_data\COF\4_2025-03-12.md'
Converted 'data\edgar_documents\COF\4_2025-05-12' --> 'data\processed_data\COF\4_2025-05-12.md'


2025-11-14 16:03:00,647 - INFO - Finished converting document 4_2025-05-14 in 0.08 sec.
2025-11-14 16:03:00,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,723 - INFO - Going to convert document batch...
2025-11-14 16:03:00,724 - INFO - Processing document 4_2025-05-20
2025-11-14 16:03:00,760 - INFO - Finished converting document 4_2025-05-20 in 0.08 sec.
2025-11-14 16:03:00,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,826 - INFO - Going to convert document batch...
2025-11-14 16:03:00,827 - INFO - Processing document 4_2025-06-05
2025-11-14 16:03:00,860 - INFO - Finished converting document 4_2025-06-05 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2025-05-14' --> 'data\processed_data\COF\4_2025-05-14.md'
Converted 'data\edgar_documents\COF\4_2025-05-20' --> 'data\processed_data\COF\4_2025-05-20.md'


2025-11-14 16:03:00,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,936 - INFO - Going to convert document batch...
2025-11-14 16:03:00,937 - INFO - Processing document 4_2025-07-25
2025-11-14 16:03:00,972 - INFO - Finished converting document 4_2025-07-25 in 0.08 sec.
2025-11-14 16:03:01,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,057 - INFO - Going to convert document batch...
2025-11-14 16:03:01,059 - INFO - Processing document 4_2025-08-05


Converted 'data\edgar_documents\COF\4_2025-06-05' --> 'data\processed_data\COF\4_2025-06-05.md'
Converted 'data\edgar_documents\COF\4_2025-07-25' --> 'data\processed_data\COF\4_2025-07-25.md'


2025-11-14 16:03:01,149 - INFO - Finished converting document 4_2025-08-05 in 0.12 sec.
2025-11-14 16:03:01,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,235 - INFO - Going to convert document batch...
2025-11-14 16:03:01,236 - INFO - Processing document 4_2025-08-06
2025-11-14 16:03:01,275 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 16:03:01,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,354 - INFO - Going to convert document batch...
2025-11-14 16:03:01,356 - INFO - Processing document 4_2025-08-13
2025-11-14 16:03:01,399 - INFO - Finished converting document 4_2025-08-13 in 0.08 sec.


Converted 'data\edgar_documents\COF\4_2025-08-05' --> 'data\processed_data\COF\4_2025-08-05.md'
Converted 'data\edgar_documents\COF\4_2025-08-06' --> 'data\processed_data\COF\4_2025-08-06.md'


2025-11-14 16:03:01,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,490 - INFO - Going to convert document batch...
2025-11-14 16:03:01,491 - INFO - Processing document 4_2025-08-20
2025-11-14 16:03:01,527 - INFO - Finished converting document 4_2025-08-20 in 0.08 sec.
2025-11-14 16:03:01,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,588 - INFO - Going to convert document batch...
2025-11-14 16:03:01,591 - INFO - Processing document 4_2025-09-03
2025-11-14 16:03:01,633 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2025-08-13' --> 'data\processed_data\COF\4_2025-08-13.md'
Converted 'data\edgar_documents\COF\4_2025-08-20' --> 'data\processed_data\COF\4_2025-08-20.md'


2025-11-14 16:03:01,755 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:01,757 - ERROR - Input document 4_2025-09-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:03:01,761 - INFO - Going to convert document batch...
2025-11-14 16:03:01,788 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:01,789 - ERROR - Input document 4_2025-09-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\COF\4_2025-09-03' --> 'data\processed_data\COF\4_2025-09-03.md'
Error processing data\edgar_documents\COF\4_2025-09-08: File format not allowed: data\edgar_documents\COF\4_2025-09-08
Error processing data\edgar_documents\COF\4_2025-09-10: File format not allowed: data\edgar_documents\COF\4_2025-09-10


2025-11-14 16:03:01,903 - INFO - Finished converting document 4_2025-10-03 in 0.11 sec.
2025-11-14 16:03:01,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,005 - INFO - Going to convert document batch...
2025-11-14 16:03:02,006 - INFO - Processing document 4_2025-10-29
2025-11-14 16:03:02,100 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2025-10-03' --> 'data\processed_data\COF\4_2025-10-03.md'


2025-11-14 16:03:02,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,254 - INFO - Going to convert document batch...
2025-11-14 16:03:02,255 - INFO - Processing document 4_2025-11-06
2025-11-14 16:03:02,292 - INFO - Finished converting document 4_2025-11-06 in 0.11 sec.
2025-11-14 16:03:02,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2025-10-29' --> 'data\processed_data\COF\4_2025-10-29.md'
Converted 'data\edgar_documents\COF\4_2025-11-06' --> 'data\processed_data\COF\4_2025-11-06.md'


2025-11-14 16:03:02,383 - INFO - Going to convert document batch...
2025-11-14 16:03:02,386 - INFO - Processing document 4_2025-11-07
2025-11-14 16:03:02,451 - INFO - Finished converting document 4_2025-11-07 in 0.12 sec.
2025-11-14 16:03:02,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,553 - INFO - Going to convert document batch...
2025-11-14 16:03:02,554 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:03:02,619 - INFO - Finished converting document 8-K_2023-01-24 in 0.12 sec.
2025-11-14 16:03:02,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2025-11-07' --> 'data\processed_data\COF\4_2025-11-07.md'
Converted 'data\edgar_documents\COF\8-K_2023-01-24' --> 'data\processed_data\COF\8-K_2023-01-24.md'


2025-11-14 16:03:02,733 - INFO - Going to convert document batch...
2025-11-14 16:03:02,734 - INFO - Processing document 8-K_2023-01-30
2025-11-14 16:03:02,776 - INFO - Finished converting document 8-K_2023-01-30 in 0.14 sec.
2025-11-14 16:03:02,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,915 - INFO - Going to convert document batch...
2025-11-14 16:03:02,916 - INFO - Processing document 8-K_2023-01-31
2025-11-14 16:03:02,970 - INFO - Finished converting document 8-K_2023-01-31 in 0.17 sec.


Converted 'data\edgar_documents\COF\8-K_2023-01-30' --> 'data\processed_data\COF\8-K_2023-01-30.md'


2025-11-14 16:03:03,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,033 - INFO - Going to convert document batch...
2025-11-14 16:03:03,034 - INFO - Processing document 8-K_2023-02-01
2025-11-14 16:03:03,084 - INFO - Finished converting document 8-K_2023-02-01 in 0.09 sec.
2025-11-14 16:03:03,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,171 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-01-31' --> 'data\processed_data\COF\8-K_2023-01-31.md'
Converted 'data\edgar_documents\COF\8-K_2023-02-01' --> 'data\processed_data\COF\8-K_2023-02-01.md'


2025-11-14 16:03:03,173 - INFO - Processing document 8-K_2023-02-13
2025-11-14 16:03:03,228 - INFO - Finished converting document 8-K_2023-02-13 in 0.11 sec.
2025-11-14 16:03:03,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,317 - INFO - Going to convert document batch...
2025-11-14 16:03:03,319 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:03:03,377 - INFO - Finished converting document 8-K_2023-02-15 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2023-02-13' --> 'data\processed_data\COF\8-K_2023-02-13.md'
Converted 'data\edgar_documents\COF\8-K_2023-02-15' --> 'data\processed_data\COF\8-K_2023-02-15.md'


2025-11-14 16:03:03,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,503 - INFO - Going to convert document batch...
2025-11-14 16:03:03,504 - INFO - Processing document 8-K_2023-02-16
2025-11-14 16:03:03,546 - INFO - Finished converting document 8-K_2023-02-16 in 0.14 sec.
2025-11-14 16:03:03,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,644 - INFO - Going to convert document batch...
2025-11-14 16:03:03,645 - INFO - Processing document 8-K_2023-03-07
2025-11-14 16:03:03,693 - INFO - Finished converting document 8-K_2023-03-07 in 0.12 sec.
2025-11-14 16:03:03,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-02-16' --> 'data\processed_data\COF\8-K_2023-02-16.md'
Converted 'data\edgar_documents\COF\8-K_2023-03-07' --> 'data\processed_data\COF\8-K_2023-03-07.md'


2025-11-14 16:03:03,804 - INFO - Going to convert document batch...
2025-11-14 16:03:03,805 - INFO - Processing document 8-K_2023-03-15
2025-11-14 16:03:03,848 - INFO - Finished converting document 8-K_2023-03-15 in 0.12 sec.
2025-11-14 16:03:03,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,910 - INFO - Going to convert document batch...
2025-11-14 16:03:03,911 - INFO - Processing document 8-K_2023-04-07
2025-11-14 16:03:03,977 - INFO - Finished converting document 8-K_2023-04-07 in 0.11 sec.
2025-11-14 16:03:04,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-03-15' --> 'data\processed_data\COF\8-K_2023-03-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-04-07' --> 'data\processed_data\COF\8-K_2023-04-07.md'


2025-11-14 16:03:04,080 - INFO - Going to convert document batch...
2025-11-14 16:03:04,081 - INFO - Processing document 8-K_2023-04-27
2025-11-14 16:03:04,114 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 16:03:04,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,189 - INFO - Going to convert document batch...
2025-11-14 16:03:04,191 - INFO - Processing document 8-K_2023-05-08
2025-11-14 16:03:04,240 - INFO - Finished converting document 8-K_2023-05-08 in 0.09 sec.
2025-11-14 16:03:04,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,335 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-04-27' --> 'data\processed_data\COF\8-K_2023-04-27.md'
Converted 'data\edgar_documents\COF\8-K_2023-05-08' --> 'data\processed_data\COF\8-K_2023-05-08.md'


2025-11-14 16:03:04,337 - INFO - Processing document 8-K_2023-05-09
2025-11-14 16:03:04,403 - INFO - Finished converting document 8-K_2023-05-09 in 0.16 sec.
2025-11-14 16:03:04,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,523 - INFO - Going to convert document batch...
2025-11-14 16:03:04,524 - INFO - Processing document 8-K_2023-05-12
2025-11-14 16:03:04,561 - INFO - Finished converting document 8-K_2023-05-12 in 0.14 sec.


Converted 'data\edgar_documents\COF\8-K_2023-05-09' --> 'data\processed_data\COF\8-K_2023-05-09.md'
Converted 'data\edgar_documents\COF\8-K_2023-05-12' --> 'data\processed_data\COF\8-K_2023-05-12.md'


2025-11-14 16:03:04,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,669 - INFO - Going to convert document batch...
2025-11-14 16:03:04,671 - INFO - Processing document 8-K_2023-06-08
2025-11-14 16:03:04,750 - INFO - Finished converting document 8-K_2023-06-08 in 0.17 sec.
2025-11-14 16:03:04,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,860 - INFO - Going to convert document batch...
2025-11-14 16:03:04,862 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:03:04,929 - INFO - Finished converting document 8-K_2023-06-12 in 0.12 sec.
2025-11-14 16:03:04,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-06-08' --> 'data\processed_data\COF\8-K_2023-06-08.md'
Converted 'data\edgar_documents\COF\8-K_2023-06-12' --> 'data\processed_data\COF\8-K_2023-06-12.md'


2025-11-14 16:03:05,056 - INFO - Going to convert document batch...
2025-11-14 16:03:05,057 - INFO - Processing document 8-K_2023-06-15
2025-11-14 16:03:05,096 - INFO - Finished converting document 8-K_2023-06-15 in 0.14 sec.
2025-11-14 16:03:05,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,195 - INFO - Going to convert document batch...
2025-11-14 16:03:05,195 - INFO - Processing document 8-K_2023-06-30
2025-11-14 16:03:05,229 - INFO - Finished converting document 8-K_2023-06-30 in 0.09 sec.
2025-11-14 16:03:05,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-06-15' --> 'data\processed_data\COF\8-K_2023-06-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-06-30' --> 'data\processed_data\COF\8-K_2023-06-30.md'


2025-11-14 16:03:05,342 - INFO - Going to convert document batch...
2025-11-14 16:03:05,343 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:03:05,402 - INFO - Finished converting document 8-K_2023-07-20 in 0.16 sec.
2025-11-14 16:03:05,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,472 - INFO - Going to convert document batch...
2025-11-14 16:03:05,473 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:03:05,512 - INFO - Finished converting document 8-K_2023-07-26 in 0.09 sec.
2025-11-14 16:03:05,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,611 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-07-20' --> 'data\processed_data\COF\8-K_2023-07-20.md'
Converted 'data\edgar_documents\COF\8-K_2023-07-26' --> 'data\processed_data\COF\8-K_2023-07-26.md'


2025-11-14 16:03:05,613 - INFO - Processing document 8-K_2023-08-15
2025-11-14 16:03:05,681 - INFO - Finished converting document 8-K_2023-08-15 in 0.14 sec.
2025-11-14 16:03:05,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,757 - INFO - Going to convert document batch...
2025-11-14 16:03:05,758 - INFO - Processing document 8-K_2023-09-08
2025-11-14 16:03:05,795 - INFO - Finished converting document 8-K_2023-09-08 in 0.09 sec.
2025-11-14 16:03:05,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,892 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-08-15' --> 'data\processed_data\COF\8-K_2023-08-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-09-08' --> 'data\processed_data\COF\8-K_2023-09-08.md'


2025-11-14 16:03:05,893 - INFO - Processing document 8-K_2023-09-15
2025-11-14 16:03:05,932 - INFO - Finished converting document 8-K_2023-09-15 in 0.11 sec.
2025-11-14 16:03:05,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,009 - INFO - Going to convert document batch...
2025-11-14 16:03:06,010 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:03:06,045 - INFO - Finished converting document 8-K_2023-10-26 in 0.09 sec.
2025-11-14 16:03:06,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,108 - INFO - Going to convert document batch...
2025-11-14 16:03:06,110 - INFO - Processing document 8-K_2023-11-01


Converted 'data\edgar_documents\COF\8-K_2023-09-15' --> 'data\processed_data\COF\8-K_2023-09-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-10-26' --> 'data\processed_data\COF\8-K_2023-10-26.md'


2025-11-14 16:03:06,210 - INFO - Finished converting document 8-K_2023-11-01 in 0.14 sec.
2025-11-14 16:03:06,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,344 - INFO - Going to convert document batch...
2025-11-14 16:03:06,347 - INFO - Processing document 8-K_2023-11-15
2025-11-14 16:03:06,388 - INFO - Finished converting document 8-K_2023-11-15 in 0.12 sec.
2025-11-14 16:03:06,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-11-01' --> 'data\processed_data\COF\8-K_2023-11-01.md'
Converted 'data\edgar_documents\COF\8-K_2023-11-15' --> 'data\processed_data\COF\8-K_2023-11-15.md'


2025-11-14 16:03:06,468 - INFO - Going to convert document batch...
2025-11-14 16:03:06,469 - INFO - Processing document 8-K_2023-12-04
2025-11-14 16:03:06,508 - INFO - Finished converting document 8-K_2023-12-04 in 0.09 sec.
2025-11-14 16:03:06,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,569 - INFO - Going to convert document batch...
2025-11-14 16:03:06,570 - INFO - Processing document 8-K_2023-12-15
2025-11-14 16:03:06,625 - INFO - Finished converting document 8-K_2023-12-15 in 0.09 sec.
2025-11-14 16:03:06,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,710 - INFO - Going to convert document batch...
2025-11-14 16:03:06,711 - INFO - Processing document 8-K_2024-01-25
2025-11-14 16:03:06,744 - INFO - Finished converting document 8-K_2024-01-25 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2023-12-04' --> 'data\processed_data\COF\8-K_2023-12-04.md'
Converted 'data\edgar_documents\COF\8-K_2023-12-15' --> 'data\processed_data\COF\8-K_2023-12-15.md'


2025-11-14 16:03:06,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,813 - INFO - Going to convert document batch...
2025-11-14 16:03:06,815 - INFO - Processing document 8-K_2024-02-01
2025-11-14 16:03:06,872 - INFO - Finished converting document 8-K_2024-02-01 in 0.11 sec.
2025-11-14 16:03:06,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,954 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-01-25' --> 'data\processed_data\COF\8-K_2024-01-25.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-01' --> 'data\processed_data\COF\8-K_2024-02-01.md'


2025-11-14 16:03:06,955 - INFO - Processing document 8-K_2024-02-05
2025-11-14 16:03:07,016 - INFO - Finished converting document 8-K_2024-02-05 in 0.12 sec.
2025-11-14 16:03:07,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,116 - INFO - Going to convert document batch...
2025-11-14 16:03:07,118 - INFO - Processing document 8-K_2024-02-15
2025-11-14 16:03:07,167 - INFO - Finished converting document 8-K_2024-02-15 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2024-02-05' --> 'data\processed_data\COF\8-K_2024-02-05.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-15' --> 'data\processed_data\COF\8-K_2024-02-15.md'


2025-11-14 16:03:07,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,275 - INFO - Going to convert document batch...
2025-11-14 16:03:07,276 - INFO - Processing document 8-K_2024-02-20
2025-11-14 16:03:07,334 - INFO - Finished converting document 8-K_2024-02-20 in 0.12 sec.
2025-11-14 16:03:07,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,439 - INFO - Going to convert document batch...
2025-11-14 16:03:07,442 - INFO - Processing document 8-K_2024-02-22


Converted 'data\edgar_documents\COF\8-K_2024-02-20' --> 'data\processed_data\COF\8-K_2024-02-20.md'


2025-11-14 16:03:07,576 - INFO - Finished converting document 8-K_2024-02-22 in 0.22 sec.
2025-11-14 16:03:07,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2024-02-22' --> 'data\processed_data\COF\8-K_2024-02-22.md'


2025-11-14 16:03:09,198 - INFO - Going to convert document batch...
2025-11-14 16:03:09,199 - INFO - Processing document 8-K_2024-02-26
2025-11-14 16:03:09,235 - INFO - Finished converting document 8-K_2024-02-26 in 1.62 sec.
2025-11-14 16:03:09,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,296 - INFO - Going to convert document batch...
2025-11-14 16:03:09,298 - INFO - Processing document 8-K_2024-02-29
2025-11-14 16:03:09,334 - INFO - Finished converting document 8-K_2024-02-29 in 0.08 sec.
2025-11-14 16:03:09,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,413 - INFO - Going to convert document batch...
2025-11-14 16:03:09,415 - INFO - Processing document 8-K_2024-03-04


Converted 'data\edgar_documents\COF\8-K_2024-02-26' --> 'data\processed_data\COF\8-K_2024-02-26.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-29' --> 'data\processed_data\COF\8-K_2024-02-29.md'


2025-11-14 16:03:09,454 - INFO - Finished converting document 8-K_2024-03-04 in 0.11 sec.
2025-11-14 16:03:09,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,530 - INFO - Going to convert document batch...
2025-11-14 16:03:09,533 - INFO - Processing document 8-K_2024-03-11
2025-11-14 16:03:09,581 - INFO - Finished converting document 8-K_2024-03-11 in 0.11 sec.
2025-11-14 16:03:09,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-03-04' --> 'data\processed_data\COF\8-K_2024-03-04.md'
Converted 'data\edgar_documents\COF\8-K_2024-03-11' --> 'data\processed_data\COF\8-K_2024-03-11.md'


2025-11-14 16:03:09,684 - INFO - Processing document 8-K_2024-03-15
2025-11-14 16:03:09,747 - INFO - Finished converting document 8-K_2024-03-15 in 0.14 sec.
2025-11-14 16:03:09,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,832 - INFO - Going to convert document batch...
2025-11-14 16:03:09,834 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:03:09,898 - INFO - Finished converting document 8-K_2024-04-25 in 0.12 sec.
2025-11-14 16:03:09,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2024-03-15' --> 'data\processed_data\COF\8-K_2024-03-15.md'
Converted 'data\edgar_documents\COF\8-K_2024-04-25' --> 'data\processed_data\COF\8-K_2024-04-25.md'


2025-11-14 16:03:10,002 - INFO - Going to convert document batch...
2025-11-14 16:03:10,003 - INFO - Processing document 8-K_2024-05-03
2025-11-14 16:03:10,080 - INFO - Finished converting document 8-K_2024-05-03 in 0.16 sec.
2025-11-14 16:03:10,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,176 - INFO - Going to convert document batch...
2025-11-14 16:03:10,177 - INFO - Processing document 8-K_2024-05-15
2025-11-14 16:03:10,209 - INFO - Finished converting document 8-K_2024-05-15 in 0.08 sec.
2025-11-14 16:03:10,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,302 - INFO - Going to convert document batch...
2025-11-14 16:03:10,304 - INFO - Processing document 8-K_2024-05-24


Converted 'data\edgar_documents\COF\8-K_2024-05-03' --> 'data\processed_data\COF\8-K_2024-05-03.md'
Converted 'data\edgar_documents\COF\8-K_2024-05-15' --> 'data\processed_data\COF\8-K_2024-05-15.md'


2025-11-14 16:03:10,352 - INFO - Finished converting document 8-K_2024-05-24 in 0.12 sec.
2025-11-14 16:03:10,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,440 - INFO - Going to convert document batch...
2025-11-14 16:03:10,442 - INFO - Processing document 8-K_2024-06-10
2025-11-14 16:03:10,492 - INFO - Finished converting document 8-K_2024-06-10 in 0.11 sec.
2025-11-14 16:03:10,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,562 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-05-24' --> 'data\processed_data\COF\8-K_2024-05-24.md'
Converted 'data\edgar_documents\COF\8-K_2024-06-10' --> 'data\processed_data\COF\8-K_2024-06-10.md'


2025-11-14 16:03:10,564 - INFO - Processing document 8-K_2024-06-17
2025-11-14 16:03:10,604 - INFO - Finished converting document 8-K_2024-06-17 in 0.09 sec.
2025-11-14 16:03:10,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,670 - INFO - Going to convert document batch...
2025-11-14 16:03:10,671 - INFO - Processing document 8-K_2024-06-28
2025-11-14 16:03:10,705 - INFO - Finished converting document 8-K_2024-06-28 in 0.08 sec.
2025-11-14 16:03:10,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,802 - INFO - Going to convert document batch...
2025-11-14 16:03:10,803 - INFO - Processing document 8-K_2024-07-23


Converted 'data\edgar_documents\COF\8-K_2024-06-17' --> 'data\processed_data\COF\8-K_2024-06-17.md'
Converted 'data\edgar_documents\COF\8-K_2024-06-28' --> 'data\processed_data\COF\8-K_2024-06-28.md'


2025-11-14 16:03:10,852 - INFO - Finished converting document 8-K_2024-07-23 in 0.12 sec.
2025-11-14 16:03:10,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,932 - INFO - Going to convert document batch...
2025-11-14 16:03:10,933 - INFO - Processing document 8-K_2024-07-24
2025-11-14 16:03:10,979 - INFO - Finished converting document 8-K_2024-07-24 in 0.11 sec.
2025-11-14 16:03:11,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,070 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-07-23' --> 'data\processed_data\COF\8-K_2024-07-23.md'
Converted 'data\edgar_documents\COF\8-K_2024-07-24' --> 'data\processed_data\COF\8-K_2024-07-24.md'


2025-11-14 16:03:11,071 - INFO - Processing document 8-K_2024-07-26
2025-11-14 16:03:11,128 - INFO - Finished converting document 8-K_2024-07-26 in 0.12 sec.
2025-11-14 16:03:11,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,205 - INFO - Going to convert document batch...
2025-11-14 16:03:11,206 - INFO - Processing document 8-K_2024-08-15
2025-11-14 16:03:11,249 - INFO - Finished converting document 8-K_2024-08-15 in 0.09 sec.
2025-11-14 16:03:11,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,323 - INFO - Going to convert document batch...
2025-11-14 16:03:11,324 - INFO - Processing document 8-K_2024-09-09
2025-11-14 16:03:11,357 - INFO - Finished converting document 8-K_2024-09-09 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2024-07-26' --> 'data\processed_data\COF\8-K_2024-07-26.md'
Converted 'data\edgar_documents\COF\8-K_2024-08-15' --> 'data\processed_data\COF\8-K_2024-08-15.md'


2025-11-14 16:03:11,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,417 - INFO - Going to convert document batch...
2025-11-14 16:03:11,418 - INFO - Processing document 8-K_2024-09-16
2025-11-14 16:03:11,451 - INFO - Finished converting document 8-K_2024-09-16 in 0.08 sec.
2025-11-14 16:03:11,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,524 - INFO - Going to convert document batch...
2025-11-14 16:03:11,525 - INFO - Processing document 8-K_2024-10-24


Converted 'data\edgar_documents\COF\8-K_2024-09-09' --> 'data\processed_data\COF\8-K_2024-09-09.md'
Converted 'data\edgar_documents\COF\8-K_2024-09-16' --> 'data\processed_data\COF\8-K_2024-09-16.md'


2025-11-14 16:03:11,562 - INFO - Finished converting document 8-K_2024-10-24 in 0.09 sec.
2025-11-14 16:03:11,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,621 - INFO - Going to convert document batch...
2025-11-14 16:03:11,622 - INFO - Processing document 8-K_2024-11-15
2025-11-14 16:03:11,658 - INFO - Finished converting document 8-K_2024-11-15 in 0.08 sec.
2025-11-14 16:03:11,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,717 - INFO - Going to convert document batch...
2025-11-14 16:03:11,718 - INFO - Processing document 8-K_2024-12-09
2025-11-14 16:03:11,752 - INFO - Finished converting document 8-K_2024-12-09 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2024-10-24' --> 'data\processed_data\COF\8-K_2024-10-24.md'
Converted 'data\edgar_documents\COF\8-K_2024-11-15' --> 'data\processed_data\COF\8-K_2024-11-15.md'


2025-11-14 16:03:11,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,813 - INFO - Going to convert document batch...
2025-11-14 16:03:11,814 - INFO - Processing document 8-K_2024-12-16
2025-11-14 16:03:11,850 - INFO - Finished converting document 8-K_2024-12-16 in 0.08 sec.
2025-11-14 16:03:11,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,930 - INFO - Going to convert document batch...
2025-11-14 16:03:11,931 - INFO - Processing document 8-K_2025-01-21
2025-11-14 16:03:11,963 - INFO - Finished converting document 8-K_2025-01-21 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2024-12-09' --> 'data\processed_data\COF\8-K_2024-12-09.md'
Converted 'data\edgar_documents\COF\8-K_2024-12-16' --> 'data\processed_data\COF\8-K_2024-12-16.md'


2025-11-14 16:03:11,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,032 - INFO - Going to convert document batch...
2025-11-14 16:03:12,034 - INFO - Processing document 8-K_2025-01-24
2025-11-14 16:03:12,122 - INFO - Finished converting document 8-K_2025-01-24 in 0.14 sec.


Converted 'data\edgar_documents\COF\8-K_2025-01-21' --> 'data\processed_data\COF\8-K_2025-01-21.md'
Converted 'data\edgar_documents\COF\8-K_2025-01-24' --> 'data\processed_data\COF\8-K_2025-01-24.md'


2025-11-14 16:03:12,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,216 - INFO - Going to convert document batch...
2025-11-14 16:03:12,218 - INFO - Processing document 8-K_2025-01-30
2025-11-14 16:03:12,263 - INFO - Finished converting document 8-K_2025-01-30 in 0.11 sec.
2025-11-14 16:03:12,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,333 - INFO - Going to convert document batch...
2025-11-14 16:03:12,334 - INFO - Processing document 8-K_2025-02-07
2025-11-14 16:03:12,371 - INFO - Finished converting document 8-K_2025-02-07 in 0.08 sec.
2025-11-14 16:03:12,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,438 - INFO - Going to convert document batch...
2025-11-14 16:03:12,439 - INFO - Processing document 8-K_2025-02-10
2025-11-14 16:03:12,483 - INFO - Finished converting document 8-K_2025-02-10 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-01-30' --> 'data\processed_data\COF\8-K_2025-01-30.md'
Converted 'data\edgar_documents\COF\8-K_2025-02-07' --> 'data\processed_data\COF\8-K_2025-02-07.md'


2025-11-14 16:03:12,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,558 - INFO - Going to convert document batch...
2025-11-14 16:03:12,560 - INFO - Processing document 8-K_2025-02-18
2025-11-14 16:03:12,612 - INFO - Finished converting document 8-K_2025-02-18 in 0.11 sec.
2025-11-14 16:03:12,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,669 - INFO - Going to convert document batch...
2025-11-14 16:03:12,671 - INFO - Processing document 8-K_2025-03-17


Converted 'data\edgar_documents\COF\8-K_2025-02-10' --> 'data\processed_data\COF\8-K_2025-02-10.md'
Converted 'data\edgar_documents\COF\8-K_2025-02-18' --> 'data\processed_data\COF\8-K_2025-02-18.md'


2025-11-14 16:03:12,715 - INFO - Finished converting document 8-K_2025-03-17 in 0.09 sec.
2025-11-14 16:03:12,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,780 - INFO - Going to convert document batch...
2025-11-14 16:03:12,782 - INFO - Processing document 8-K_2025-04-18
2025-11-14 16:03:12,817 - INFO - Finished converting document 8-K_2025-04-18 in 0.08 sec.
2025-11-14 16:03:12,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,882 - INFO - Going to convert document batch...
2025-11-14 16:03:12,884 - INFO - Processing document 8-K_2025-04-22
2025-11-14 16:03:12,925 - INFO - Finished converting document 8-K_2025-04-22 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-03-17' --> 'data\processed_data\COF\8-K_2025-03-17.md'
Converted 'data\edgar_documents\COF\8-K_2025-04-18' --> 'data\processed_data\COF\8-K_2025-04-18.md'


2025-11-14 16:03:12,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,025 - INFO - Going to convert document batch...
2025-11-14 16:03:13,026 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:03:13,092 - INFO - Finished converting document 8-K_2025-05-08 in 0.14 sec.
2025-11-14 16:03:13,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2025-04-22' --> 'data\processed_data\COF\8-K_2025-04-22.md'
Converted 'data\edgar_documents\COF\8-K_2025-05-08' --> 'data\processed_data\COF\8-K_2025-05-08.md'


2025-11-14 16:03:13,156 - INFO - Going to convert document batch...
2025-11-14 16:03:13,158 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:03:13,191 - INFO - Finished converting document 8-K_2025-05-15 in 0.06 sec.
2025-11-14 16:03:13,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,264 - INFO - Going to convert document batch...
2025-11-14 16:03:13,266 - INFO - Processing document 8-K_2025-05-19
2025-11-14 16:03:13,324 - INFO - Finished converting document 8-K_2025-05-19 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2025-05-15' --> 'data\processed_data\COF\8-K_2025-05-15.md'
Converted 'data\edgar_documents\COF\8-K_2025-05-19' --> 'data\processed_data\COF\8-K_2025-05-19.md'


2025-11-14 16:03:13,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,444 - INFO - Going to convert document batch...
2025-11-14 16:03:13,447 - INFO - Processing document 8-K_2025-05-22
2025-11-14 16:03:13,508 - INFO - Finished converting document 8-K_2025-05-22 in 0.12 sec.
2025-11-14 16:03:13,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,604 - INFO - Going to convert document batch...
2025-11-14 16:03:13,605 - INFO - Processing document 8-K_2025-06-05
2025-11-14 16:03:13,642 - INFO - Finished converting document 8-K_2025-06-05 in 0.09 sec.
2025-11-14 16:03:13,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2025-05-22' --> 'data\processed_data\COF\8-K_2025-05-22.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-05' --> 'data\processed_data\COF\8-K_2025-06-05.md'


2025-11-14 16:03:13,736 - INFO - Going to convert document batch...
2025-11-14 16:03:13,738 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:03:13,795 - INFO - Finished converting document 8-K_2025-06-09 in 0.14 sec.
2025-11-14 16:03:13,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,888 - INFO - Going to convert document batch...
2025-11-14 16:03:13,888 - INFO - Processing document 8-K_2025-06-16
2025-11-14 16:03:13,942 - INFO - Finished converting document 8-K_2025-06-16 in 0.11 sec.


Converted 'data\edgar_documents\COF\8-K_2025-06-09' --> 'data\processed_data\COF\8-K_2025-06-09.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-16' --> 'data\processed_data\COF\8-K_2025-06-16.md'


2025-11-14 16:03:14,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,048 - INFO - Going to convert document batch...
2025-11-14 16:03:14,050 - INFO - Processing document 8-K_2025-06-25
2025-11-14 16:03:14,093 - INFO - Finished converting document 8-K_2025-06-25 in 0.11 sec.
2025-11-14 16:03:14,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,155 - INFO - Going to convert document batch...
2025-11-14 16:03:14,156 - INFO - Processing document 8-K_2025-06-30
2025-11-14 16:03:14,212 - INFO - Finished converting document 8-K_2025-06-30 in 0.09 sec.
2025-11-14 16:03:14,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,274 - INFO - Going to convert document batch...
2025-11-14 16:03:14,275 - INFO - Processing document 8-K_2025-07-01
2025-11-14 16:03:14,311 - INFO - Finished converting document 8-K_2025-07-01 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-06-25' --> 'data\processed_data\COF\8-K_2025-06-25.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-30' --> 'data\processed_data\COF\8-K_2025-06-30.md'


2025-11-14 16:03:14,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,374 - INFO - Going to convert document batch...
2025-11-14 16:03:14,375 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:03:14,409 - INFO - Finished converting document 8-K_2025-07-22 in 0.08 sec.
2025-11-14 16:03:14,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,484 - INFO - Going to convert document batch...
2025-11-14 16:03:14,485 - INFO - Processing document 8-K_2025-08-15
2025-11-14 16:03:14,519 - INFO - Finished converting document 8-K_2025-08-15 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-07-01' --> 'data\processed_data\COF\8-K_2025-07-01.md'
Converted 'data\edgar_documents\COF\8-K_2025-07-22' --> 'data\processed_data\COF\8-K_2025-07-22.md'


2025-11-14 16:03:14,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,584 - INFO - Going to convert document batch...
2025-11-14 16:03:14,585 - INFO - Processing document 8-K_2025-09-08
2025-11-14 16:03:14,639 - INFO - Finished converting document 8-K_2025-09-08 in 0.11 sec.
2025-11-14 16:03:14,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,734 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2025-08-15' --> 'data\processed_data\COF\8-K_2025-08-15.md'
Converted 'data\edgar_documents\COF\8-K_2025-09-08' --> 'data\processed_data\COF\8-K_2025-09-08.md'


2025-11-14 16:03:14,735 - INFO - Processing document 8-K_2025-09-11
2025-11-14 16:03:14,800 - INFO - Finished converting document 8-K_2025-09-11 in 0.14 sec.
2025-11-14 16:03:14,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,876 - INFO - Going to convert document batch...
2025-11-14 16:03:14,878 - INFO - Processing document 8-K_2025-09-15
2025-11-14 16:03:14,914 - INFO - Finished converting document 8-K_2025-09-15 in 0.08 sec.
2025-11-14 16:03:14,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,987 - INFO - Going to convert document batch...
2025-11-14 16:03:14,988 - INFO - Processing document 8-K_2025-10-21
2025-11-14 16:03:15,020 - INFO - Finished converting document 8-K_2025-10-21 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-09-11' --> 'data\processed_data\COF\8-K_2025-09-11.md'
Converted 'data\edgar_documents\COF\8-K_2025-09-15' --> 'data\processed_data\COF\8-K_2025-09-15.md'


2025-11-14 16:03:15,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:15,091 - INFO - Going to convert document batch...
2025-11-14 16:03:15,092 - INFO - Processing document 8-K_2025-11-07
2025-11-14 16:03:15,130 - INFO - Finished converting document 8-K_2025-11-07 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-10-21' --> 'data\processed_data\COF\8-K_2025-10-21.md'
Converted 'data\edgar_documents\COF\8-K_2025-11-07' --> 'data\processed_data\COF\8-K_2025-11-07.md'


2025-11-14 16:03:15,266 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:15,267 - ERROR - Input document DEF-14A_2023-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:03:15,271 - INFO - Going to convert document batch...
2025-11-14 16:03:15,321 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:15,323 - ERROR - Input document DEF-14A_2024-03-20 with format No

Error processing data\edgar_documents\COF\DEF-14A_2023-03-22: File format not allowed: data\edgar_documents\COF\DEF-14A_2023-03-22
Error processing data\edgar_documents\COF\DEF-14A_2024-03-20: File format not allowed: data\edgar_documents\COF\DEF-14A_2024-03-20
Error processing data\edgar_documents\COF\DEF-14A_2025-03-27: File format not allowed: data\edgar_documents\COF\DEF-14A_2025-03-27
Processed 153 new files. Errors: 33
Found 124 files to process in data\edgar_documents\COP


2025-11-14 16:03:15,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:20,709 - INFO - Going to convert document batch...
2025-11-14 16:03:20,712 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:03:20,713 - INFO - Processing document 10-K_2023-02-16
2025-11-14 16:03:33,030 - INFO - Finished converting document 10-K_2023-02-16 in 17.64 sec.
2025-11-14 16:03:36,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2023-02-16' --> 'data\processed_data\COP\10-K_2023-02-16.md'


2025-11-14 16:03:40,338 - INFO - Going to convert document batch...
2025-11-14 16:03:40,339 - INFO - Processing document 10-K_2024-02-15
2025-11-14 16:03:52,073 - INFO - Finished converting document 10-K_2024-02-15 in 15.91 sec.
2025-11-14 16:03:55,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2024-02-15' --> 'data\processed_data\COP\10-K_2024-02-15.md'


2025-11-14 16:04:00,131 - INFO - Going to convert document batch...
2025-11-14 16:04:00,133 - INFO - Processing document 10-K_2025-02-18
2025-11-14 16:04:11,729 - INFO - Finished converting document 10-K_2025-02-18 in 16.45 sec.
2025-11-14 16:04:15,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2025-02-18' --> 'data\processed_data\COP\10-K_2025-02-18.md'


2025-11-14 16:04:16,221 - INFO - Going to convert document batch...
2025-11-14 16:04:16,223 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 16:04:18,577 - INFO - Finished converting document 10-Q_2023-05-04 in 3.44 sec.
2025-11-14 16:04:19,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2023-05-04' --> 'data\processed_data\COP\10-Q_2023-05-04.md'


2025-11-14 16:04:19,813 - INFO - Going to convert document batch...
2025-11-14 16:04:19,813 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 16:04:21,637 - INFO - Finished converting document 10-Q_2023-08-03 in 2.30 sec.
2025-11-14 16:04:22,434 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:04:22,436 - ERROR - Input document 10-Q_2023-11-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:04:22,441 - INFO - Going to convert d

Converted 'data\edgar_documents\COP\10-Q_2023-08-03' --> 'data\processed_data\COP\10-Q_2023-08-03.md'
Error processing data\edgar_documents\COP\10-Q_2023-11-02: File format not allowed: data\edgar_documents\COP\10-Q_2023-11-02


2025-11-14 16:04:23,386 - INFO - Going to convert document batch...
2025-11-14 16:04:23,388 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:04:27,561 - INFO - Finished converting document 10-Q_2024-05-02 in 5.12 sec.
2025-11-14 16:04:28,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-05-02' --> 'data\processed_data\COP\10-Q_2024-05-02.md'


2025-11-14 16:04:30,193 - INFO - Going to convert document batch...
2025-11-14 16:04:30,198 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 16:04:33,042 - INFO - Finished converting document 10-Q_2024-08-01 in 4.36 sec.
2025-11-14 16:04:34,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-08-01' --> 'data\processed_data\COP\10-Q_2024-08-01.md'


2025-11-14 16:04:36,284 - INFO - Going to convert document batch...
2025-11-14 16:04:36,286 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 16:04:39,086 - INFO - Finished converting document 10-Q_2024-10-31 in 5.08 sec.
2025-11-14 16:04:40,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-10-31' --> 'data\processed_data\COP\10-Q_2024-10-31.md'


2025-11-14 16:04:41,730 - INFO - Going to convert document batch...
2025-11-14 16:04:41,733 - INFO - Processing document 10-Q_2025-05-08
2025-11-14 16:04:44,357 - INFO - Finished converting document 10-Q_2025-05-08 in 3.97 sec.
2025-11-14 16:04:46,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-05-08' --> 'data\processed_data\COP\10-Q_2025-05-08.md'


2025-11-14 16:04:48,455 - INFO - Going to convert document batch...
2025-11-14 16:04:48,457 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:04:51,648 - INFO - Finished converting document 10-Q_2025-08-07 in 4.88 sec.
2025-11-14 16:04:53,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-08-07' --> 'data\processed_data\COP\10-Q_2025-08-07.md'


2025-11-14 16:04:55,844 - INFO - Going to convert document batch...
2025-11-14 16:04:55,846 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 16:04:59,367 - INFO - Finished converting document 10-Q_2025-11-06 in 5.95 sec.
2025-11-14 16:05:01,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,345 - INFO - Going to convert document batch...
2025-11-14 16:05:01,348 - INFO - Processing document 4_2023-01-04
2025-11-14 16:05:01,414 - INFO - Finished converting document 4_2023-01-04 in 0.11 sec.
2025-11-14 16:05:01,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-11-06' --> 'data\processed_data\COP\10-Q_2025-11-06.md'
Converted 'data\edgar_documents\COP\4_2023-01-04' --> 'data\processed_data\COP\4_2023-01-04.md'


2025-11-14 16:05:01,507 - INFO - Going to convert document batch...
2025-11-14 16:05:01,509 - INFO - Processing document 4_2023-01-06
2025-11-14 16:05:01,547 - INFO - Finished converting document 4_2023-01-06 in 0.08 sec.
2025-11-14 16:05:01,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,616 - INFO - Going to convert document batch...
2025-11-14 16:05:01,617 - INFO - Processing document 4_2023-01-18
2025-11-14 16:05:01,654 - INFO - Finished converting document 4_2023-01-18 in 0.08 sec.
2025-11-14 16:05:01,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,766 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COP\4_2023-01-06' --> 'data\processed_data\COP\4_2023-01-06.md'
Converted 'data\edgar_documents\COP\4_2023-01-18' --> 'data\processed_data\COP\4_2023-01-18.md'


2025-11-14 16:05:01,767 - INFO - Processing document 4_2023-02-02
2025-11-14 16:05:01,837 - INFO - Finished converting document 4_2023-02-02 in 0.12 sec.
2025-11-14 16:05:01,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,969 - INFO - Going to convert document batch...
2025-11-14 16:05:01,972 - INFO - Processing document 4_2023-02-14
2025-11-14 16:05:02,063 - INFO - Finished converting document 4_2023-02-14 in 0.16 sec.


Converted 'data\edgar_documents\COP\4_2023-02-02' --> 'data\processed_data\COP\4_2023-02-02.md'


2025-11-14 16:05:02,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,193 - INFO - Going to convert document batch...
2025-11-14 16:05:02,197 - INFO - Processing document 4_2023-02-16
2025-11-14 16:05:02,252 - INFO - Finished converting document 4_2023-02-16 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2023-02-14' --> 'data\processed_data\COP\4_2023-02-14.md'
Converted 'data\edgar_documents\COP\4_2023-02-16' --> 'data\processed_data\COP\4_2023-02-16.md'


2025-11-14 16:05:02,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,370 - INFO - Going to convert document batch...
2025-11-14 16:05:02,372 - INFO - Processing document 4_2023-02-21
2025-11-14 16:05:02,428 - INFO - Finished converting document 4_2023-02-21 in 0.11 sec.
2025-11-14 16:05:02,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,565 - INFO - Going to convert document batch...
2025-11-14 16:05:02,568 - INFO - Processing document 4_2023-02-22
2025-11-14 16:05:02,646 - INFO - Finished converting document 4_2023-02-22 in 0.14 sec.


Converted 'data\edgar_documents\COP\4_2023-02-21' --> 'data\processed_data\COP\4_2023-02-21.md'


2025-11-14 16:05:02,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,779 - INFO - Going to convert document batch...
2025-11-14 16:05:02,781 - INFO - Processing document 4_2023-02-23
2025-11-14 16:05:02,843 - INFO - Finished converting document 4_2023-02-23 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2023-02-22' --> 'data\processed_data\COP\4_2023-02-22.md'
Converted 'data\edgar_documents\COP\4_2023-02-23' --> 'data\processed_data\COP\4_2023-02-23.md'


2025-11-14 16:05:02,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,970 - INFO - Going to convert document batch...
2025-11-14 16:05:02,971 - INFO - Processing document 4_2023-03-02
2025-11-14 16:05:03,019 - INFO - Finished converting document 4_2023-03-02 in 0.11 sec.
2025-11-14 16:05:03,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,141 - INFO - Going to convert document batch...
2025-11-14 16:05:03,144 - INFO - Processing document 4_2023-04-04
2025-11-14 16:05:03,209 - INFO - Finished converting document 4_2023-04-04 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2023-03-02' --> 'data\processed_data\COP\4_2023-03-02.md'


2025-11-14 16:05:03,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,305 - INFO - Going to convert document batch...
2025-11-14 16:05:03,306 - INFO - Processing document 4_2023-04-19
2025-11-14 16:05:03,357 - INFO - Finished converting document 4_2023-04-19 in 0.09 sec.
2025-11-14 16:05:03,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,452 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COP\4_2023-04-04' --> 'data\processed_data\COP\4_2023-04-04.md'
Converted 'data\edgar_documents\COP\4_2023-04-19' --> 'data\processed_data\COP\4_2023-04-19.md'


2025-11-14 16:05:03,456 - INFO - Processing document 4_2023-05-02
2025-11-14 16:05:03,518 - INFO - Finished converting document 4_2023-05-02 in 0.11 sec.
2025-11-14 16:05:03,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,602 - INFO - Going to convert document batch...
2025-11-14 16:05:03,603 - INFO - Processing document 4_2023-05-09
2025-11-14 16:05:03,637 - INFO - Finished converting document 4_2023-05-09 in 0.08 sec.
2025-11-14 16:05:03,732 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:03,734 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\COP\4_2023-05-02' --> 'data\processed_data\COP\4_2023-05-02.md'
Converted 'data\edgar_documents\COP\4_2023-05-09' --> 'data\processed_data\COP\4_2023-05-09.md'
Error processing data\edgar_documents\COP\4_2023-05-10: File format not allowed: data\edgar_documents\COP\4_2023-05-10


2025-11-14 16:05:03,807 - INFO - Going to convert document batch...
2025-11-14 16:05:03,809 - INFO - Processing document 4_2023-06-01
2025-11-14 16:05:03,878 - INFO - Finished converting document 4_2023-06-01 in 0.14 sec.
2025-11-14 16:05:03,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,959 - INFO - Going to convert document batch...
2025-11-14 16:05:03,959 - INFO - Processing document 4_2023-07-05
2025-11-14 16:05:03,995 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 16:05:04,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,087 - INFO - Going to convert document batch...
2025-11-14 16:05:04,092 - INFO - Processing document 4_2023-08-02


Converted 'data\edgar_documents\COP\4_2023-06-01' --> 'data\processed_data\COP\4_2023-06-01.md'
Converted 'data\edgar_documents\COP\4_2023-07-05' --> 'data\processed_data\COP\4_2023-07-05.md'


2025-11-14 16:05:04,136 - INFO - Finished converting document 4_2023-08-02 in 0.11 sec.
2025-11-14 16:05:04,233 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:04,235 - ERROR - Input document 4_2023-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:04,237 - INFO - Going to convert document batch...
2025-11-14 16:05:04,277 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:04,278 - ERROR - Input document 4_2023-08-09 with forma

Converted 'data\edgar_documents\COP\4_2023-08-02' --> 'data\processed_data\COP\4_2023-08-02.md'
Error processing data\edgar_documents\COP\4_2023-08-08: File format not allowed: data\edgar_documents\COP\4_2023-08-08
Error processing data\edgar_documents\COP\4_2023-08-09: File format not allowed: data\edgar_documents\COP\4_2023-08-09


2025-11-14 16:05:04,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,421 - INFO - Going to convert document batch...
2025-11-14 16:05:04,422 - INFO - Processing document 4_2023-09-06
2025-11-14 16:05:04,466 - INFO - Finished converting document 4_2023-09-06 in 0.08 sec.
2025-11-14 16:05:04,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,551 - INFO - Going to convert document batch...
2025-11-14 16:05:04,552 - INFO - Processing document 4_2023-09-19


Converted 'data\edgar_documents\COP\4_2023-09-05' --> 'data\processed_data\COP\4_2023-09-05.md'
Converted 'data\edgar_documents\COP\4_2023-09-06' --> 'data\processed_data\COP\4_2023-09-06.md'


2025-11-14 16:05:04,586 - INFO - Finished converting document 4_2023-09-19 in 0.06 sec.
2025-11-14 16:05:04,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,653 - INFO - Going to convert document batch...
2025-11-14 16:05:04,654 - INFO - Processing document 4_2023-09-20
2025-11-14 16:05:04,690 - INFO - Finished converting document 4_2023-09-20 in 0.06 sec.
2025-11-14 16:05:04,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2023-09-19' --> 'data\processed_data\COP\4_2023-09-19.md'
Converted 'data\edgar_documents\COP\4_2023-09-20' --> 'data\processed_data\COP\4_2023-09-20.md'


2025-11-14 16:05:04,808 - INFO - Going to convert document batch...
2025-11-14 16:05:04,811 - INFO - Processing document 4_2023-09-28
2025-11-14 16:05:04,883 - INFO - Finished converting document 4_2023-09-28 in 0.14 sec.
2025-11-14 16:05:04,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,957 - INFO - Going to convert document batch...
2025-11-14 16:05:04,959 - INFO - Processing document 4_2023-10-03
2025-11-14 16:05:04,995 - INFO - Finished converting document 4_2023-10-03 in 0.08 sec.
2025-11-14 16:05:05,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,060 - INFO - Going to convert document batch...
2025-11-14 16:05:05,063 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\COP\4_2023-09-28' --> 'data\processed_data\COP\4_2023-09-28.md'
Converted 'data\edgar_documents\COP\4_2023-10-03' --> 'data\processed_data\COP\4_2023-10-03.md'


2025-11-14 16:05:05,109 - INFO - Finished converting document 4_2023-11-02 in 0.08 sec.
2025-11-14 16:05:05,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,181 - INFO - Going to convert document batch...
2025-11-14 16:05:05,182 - INFO - Processing document 4_2023-11-13
2025-11-14 16:05:05,216 - INFO - Finished converting document 4_2023-11-13 in 0.08 sec.
2025-11-14 16:05:05,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,287 - INFO - Going to convert document batch...
2025-11-14 16:05:05,290 - INFO - Processing document 4_2023-12-04
2025-11-14 16:05:05,325 - INFO - Finished converting document 4_2023-12-04 in 0.08 sec.


Converted 'data\edgar_documents\COP\4_2023-11-02' --> 'data\processed_data\COP\4_2023-11-02.md'
Converted 'data\edgar_documents\COP\4_2023-11-13' --> 'data\processed_data\COP\4_2023-11-13.md'


2025-11-14 16:05:05,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,394 - INFO - Going to convert document batch...
2025-11-14 16:05:05,395 - INFO - Processing document 4_2023-12-18
2025-11-14 16:05:05,437 - INFO - Finished converting document 4_2023-12-18 in 0.08 sec.
2025-11-14 16:05:05,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2023-12-04' --> 'data\processed_data\COP\4_2023-12-04.md'
Converted 'data\edgar_documents\COP\4_2023-12-18' --> 'data\processed_data\COP\4_2023-12-18.md'


2025-11-14 16:05:06,238 - INFO - Going to convert document batch...
2025-11-14 16:05:06,240 - INFO - Processing document 4_2024-01-02
2025-11-14 16:05:06,276 - INFO - Finished converting document 4_2024-01-02 in 0.81 sec.
2025-11-14 16:05:06,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,500 - INFO - Going to convert document batch...
2025-11-14 16:05:06,502 - INFO - Processing document 4_2024-01-04


Converted 'data\edgar_documents\COP\4_2024-01-02' --> 'data\processed_data\COP\4_2024-01-02.md'


2025-11-14 16:05:06,558 - INFO - Finished converting document 4_2024-01-04 in 0.23 sec.
2025-11-14 16:05:06,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,656 - INFO - Going to convert document batch...
2025-11-14 16:05:06,657 - INFO - Processing document 4_2024-01-05
2025-11-14 16:05:06,691 - INFO - Finished converting document 4_2024-01-05 in 0.08 sec.
2025-11-14 16:05:06,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,759 - INFO - Going to convert document batch...
2025-11-14 16:05:06,760 - INFO - Processing document 4_2024-01-17
2025-11-14 16:05:06,781 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.


Converted 'data\edgar_documents\COP\4_2024-01-04' --> 'data\processed_data\COP\4_2024-01-04.md'
Converted 'data\edgar_documents\COP\4_2024-01-05' --> 'data\processed_data\COP\4_2024-01-05.md'
Converted 'data\edgar_documents\COP\4_2024-01-17' --> 'data\processed_data\COP\4_2024-01-17.md'


2025-11-14 16:05:06,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,874 - INFO - Going to convert document batch...
2025-11-14 16:05:06,890 - INFO - Processing document 4_2024-02-02
2025-11-14 16:05:06,927 - INFO - Finished converting document 4_2024-02-02 in 0.11 sec.
2025-11-14 16:05:06,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,007 - INFO - Going to convert document batch...
2025-11-14 16:05:07,008 - INFO - Processing document 4_2024-02-13
2025-11-14 16:05:07,077 - INFO - Finished converting document 4_2024-02-13 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-02-02' --> 'data\processed_data\COP\4_2024-02-02.md'
Converted 'data\edgar_documents\COP\4_2024-02-13' --> 'data\processed_data\COP\4_2024-02-13.md'


2025-11-14 16:05:07,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,203 - INFO - Going to convert document batch...
2025-11-14 16:05:07,206 - INFO - Processing document 4_2024-02-14
2025-11-14 16:05:07,286 - INFO - Finished converting document 4_2024-02-14 in 0.14 sec.
2025-11-14 16:05:07,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,357 - INFO - Going to convert document batch...
2025-11-14 16:05:07,358 - INFO - Processing document 4_2024-02-22
2025-11-14 16:05:07,390 - INFO - Finished converting document 4_2024-02-22 in 0.06 sec.
2025-11-14 16:05:07,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,471 - INFO - Going to convert document batch...
2025-11-14 16:05:07,472 - INFO - Processing document 4_2024-02-29
2025-11-14 16:05:07,505 - INFO - Finished converting document 4_2024-02-29 in 0.08 sec.


Converted 'data\edgar_documents\COP\4_2024-02-14' --> 'data\processed_data\COP\4_2024-02-14.md'
Converted 'data\edgar_documents\COP\4_2024-02-22' --> 'data\processed_data\COP\4_2024-02-22.md'


2025-11-14 16:05:07,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,591 - INFO - Going to convert document batch...
2025-11-14 16:05:07,593 - INFO - Processing document 4_2024-03-04
2025-11-14 16:05:07,628 - INFO - Finished converting document 4_2024-03-04 in 0.08 sec.
2025-11-14 16:05:07,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,713 - INFO - Going to convert document batch...
2025-11-14 16:05:07,714 - INFO - Processing document 4_2024-03-25


Converted 'data\edgar_documents\COP\4_2024-02-29' --> 'data\processed_data\COP\4_2024-02-29.md'
Converted 'data\edgar_documents\COP\4_2024-03-04' --> 'data\processed_data\COP\4_2024-03-04.md'


2025-11-14 16:05:07,762 - INFO - Finished converting document 4_2024-03-25 in 0.11 sec.
2025-11-14 16:05:07,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,877 - INFO - Going to convert document batch...
2025-11-14 16:05:07,879 - INFO - Processing document 4_2024-03-26
2025-11-14 16:05:07,951 - INFO - Finished converting document 4_2024-03-26 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2024-03-25' --> 'data\processed_data\COP\4_2024-03-25.md'
Converted 'data\edgar_documents\COP\4_2024-03-26' --> 'data\processed_data\COP\4_2024-03-26.md'


2025-11-14 16:05:08,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,064 - INFO - Going to convert document batch...
2025-11-14 16:05:08,066 - INFO - Processing document 4_2024-04-02
2025-11-14 16:05:08,104 - INFO - Finished converting document 4_2024-04-02 in 0.09 sec.
2025-11-14 16:05:08,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,170 - INFO - Going to convert document batch...
2025-11-14 16:05:08,178 - INFO - Processing document 4_2024-04-17
2025-11-14 16:05:08,226 - INFO - Finished converting document 4_2024-04-17 in 0.08 sec.
2025-11-14 16:05:08,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-04-02' --> 'data\processed_data\COP\4_2024-04-02.md'
Converted 'data\edgar_documents\COP\4_2024-04-17' --> 'data\processed_data\COP\4_2024-04-17.md'


2025-11-14 16:05:08,343 - INFO - Going to convert document batch...
2025-11-14 16:05:08,346 - INFO - Processing document 4_2024-05-02
2025-11-14 16:05:08,398 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 16:05:08,479 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:08,481 - ERROR - Input document 4_2024-05-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:08,483 - INFO - Going to convert document batch...
2025-11-14 16:05:08,505 - IN

Converted 'data\edgar_documents\COP\4_2024-05-02' --> 'data\processed_data\COP\4_2024-05-02.md'
Error processing data\edgar_documents\COP\4_2024-05-29: File format not allowed: data\edgar_documents\COP\4_2024-05-29
Converted 'data\edgar_documents\COP\4_2024-06-04' --> 'data\processed_data\COP\4_2024-06-04.md'


2025-11-14 16:05:08,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,715 - INFO - Going to convert document batch...
2025-11-14 16:05:08,718 - INFO - Processing document 4_2024-07-02
2025-11-14 16:05:08,842 - INFO - Finished converting document 4_2024-07-02 in 0.20 sec.
2025-11-14 16:05:08,905 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:08,907 - ERROR - Input document 4_2024-07-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05

Converted 'data\edgar_documents\COP\4_2024-07-02' --> 'data\processed_data\COP\4_2024-07-02.md'
Error processing data\edgar_documents\COP\4_2024-07-12: File format not allowed: data\edgar_documents\COP\4_2024-07-12
Error processing data\edgar_documents\COP\4_2024-07-29: File format not allowed: data\edgar_documents\COP\4_2024-07-29
Error processing data\edgar_documents\COP\4_2024-08-01: File format not allowed: data\edgar_documents\COP\4_2024-08-01


2025-11-14 16:05:09,100 - INFO - Going to convert document batch...
2025-11-14 16:05:09,102 - INFO - Processing document 4_2024-08-02
2025-11-14 16:05:09,163 - INFO - Finished converting document 4_2024-08-02 in 0.11 sec.
2025-11-14 16:05:09,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,257 - INFO - Going to convert document batch...
2025-11-14 16:05:09,259 - INFO - Processing document 4_2024-08-14
2025-11-14 16:05:09,327 - INFO - Finished converting document 4_2024-08-14 in 0.12 sec.
2025-11-14 16:05:09,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-08-02' --> 'data\processed_data\COP\4_2024-08-02.md'
Converted 'data\edgar_documents\COP\4_2024-08-14' --> 'data\processed_data\COP\4_2024-08-14.md'


2025-11-14 16:05:09,459 - INFO - Going to convert document batch...
2025-11-14 16:05:09,462 - INFO - Processing document 4_2024-09-04
2025-11-14 16:05:09,506 - INFO - Finished converting document 4_2024-09-04 in 0.11 sec.
2025-11-14 16:05:09,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,609 - INFO - Going to convert document batch...
2025-11-14 16:05:09,611 - INFO - Processing document 4_2024-10-02
2025-11-14 16:05:09,674 - INFO - Finished converting document 4_2024-10-02 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-09-04' --> 'data\processed_data\COP\4_2024-09-04.md'


2025-11-14 16:05:09,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,822 - INFO - Going to convert document batch...
2025-11-14 16:05:09,824 - INFO - Processing document 4_2024-11-04
2025-11-14 16:05:09,876 - INFO - Finished converting document 4_2024-11-04 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-10-02' --> 'data\processed_data\COP\4_2024-10-02.md'
Converted 'data\edgar_documents\COP\4_2024-11-04' --> 'data\processed_data\COP\4_2024-11-04.md'


2025-11-14 16:05:09,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,998 - INFO - Going to convert document batch...
2025-11-14 16:05:10,000 - INFO - Processing document 4_2024-11-22
2025-11-14 16:05:10,086 - INFO - Finished converting document 4_2024-11-22 in 0.16 sec.
2025-11-14 16:05:10,192 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:10,193 - ERROR - Input document 4_2024-11-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05

Converted 'data\edgar_documents\COP\4_2024-11-22' --> 'data\processed_data\COP\4_2024-11-22.md'
Error processing data\edgar_documents\COP\4_2024-11-25: File format not allowed: data\edgar_documents\COP\4_2024-11-25
Error processing data\edgar_documents\COP\4_2024-11-26: File format not allowed: data\edgar_documents\COP\4_2024-11-26


2025-11-14 16:05:10,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,467 - INFO - Going to convert document batch...
2025-11-14 16:05:10,469 - INFO - Processing document 4_2024-12-16
2025-11-14 16:05:10,542 - INFO - Finished converting document 4_2024-12-16 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2024-12-02' --> 'data\processed_data\COP\4_2024-12-02.md'
Converted 'data\edgar_documents\COP\4_2024-12-16' --> 'data\processed_data\COP\4_2024-12-16.md'


2025-11-14 16:05:10,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,656 - INFO - Going to convert document batch...
2025-11-14 16:05:10,657 - INFO - Processing document 4_2024-12-18
2025-11-14 16:05:10,711 - INFO - Finished converting document 4_2024-12-18 in 0.11 sec.
2025-11-14 16:05:10,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,814 - INFO - Going to convert document batch...
2025-11-14 16:05:10,817 - INFO - Processing document 4_2024-12-20
2025-11-14 16:05:10,881 - INFO - Finished converting document 4_2024-12-20 in 0.11 sec.
2025-11-14 16:05:10,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-12-18' --> 'data\processed_data\COP\4_2024-12-18.md'
Converted 'data\edgar_documents\COP\4_2024-12-20' --> 'data\processed_data\COP\4_2024-12-20.md'


2025-11-14 16:05:10,992 - INFO - Going to convert document batch...
2025-11-14 16:05:10,994 - INFO - Processing document 4_2024-12-30
2025-11-14 16:05:11,047 - INFO - Finished converting document 4_2024-12-30 in 0.11 sec.
2025-11-14 16:05:11,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,117 - INFO - Going to convert document batch...
2025-11-14 16:05:11,117 - INFO - Processing document 4_2025-01-02
2025-11-14 16:05:11,180 - INFO - Finished converting document 4_2025-01-02 in 0.09 sec.


Converted 'data\edgar_documents\COP\4_2024-12-30' --> 'data\processed_data\COP\4_2024-12-30.md'
Converted 'data\edgar_documents\COP\4_2025-01-02' --> 'data\processed_data\COP\4_2025-01-02.md'


2025-11-14 16:05:11,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,303 - INFO - Going to convert document batch...
2025-11-14 16:05:11,306 - INFO - Processing document 4_2025-01-17
2025-11-14 16:05:11,373 - INFO - Finished converting document 4_2025-01-17 in 0.14 sec.
2025-11-14 16:05:11,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,480 - INFO - Going to convert document batch...
2025-11-14 16:05:11,482 - INFO - Processing document 4_2025-02-04
2025-11-14 16:05:11,547 - INFO - Finished converting document 4_2025-02-04 in 0.11 sec.
2025-11-14 16:05:11,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-01-17' --> 'data\processed_data\COP\4_2025-01-17.md'
Converted 'data\edgar_documents\COP\4_2025-02-04' --> 'data\processed_data\COP\4_2025-02-04.md'


2025-11-14 16:05:11,685 - INFO - Going to convert document batch...
2025-11-14 16:05:11,686 - INFO - Processing document 4_2025-02-11
2025-11-14 16:05:11,727 - INFO - Finished converting document 4_2025-02-11 in 0.11 sec.
2025-11-14 16:05:11,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,821 - INFO - Going to convert document batch...
2025-11-14 16:05:11,822 - INFO - Processing document 4_2025-02-13
2025-11-14 16:05:11,858 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 16:05:11,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-02-11' --> 'data\processed_data\COP\4_2025-02-11.md'
Converted 'data\edgar_documents\COP\4_2025-02-13' --> 'data\processed_data\COP\4_2025-02-13.md'


2025-11-14 16:05:11,981 - INFO - Going to convert document batch...
2025-11-14 16:05:11,984 - INFO - Processing document 4_2025-03-04
2025-11-14 16:05:12,053 - INFO - Finished converting document 4_2025-03-04 in 0.12 sec.
2025-11-14 16:05:12,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,146 - INFO - Going to convert document batch...
2025-11-14 16:05:12,148 - INFO - Processing document 4_2025-04-02
2025-11-14 16:05:12,201 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.
2025-11-14 16:05:12,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-03-04' --> 'data\processed_data\COP\4_2025-03-04.md'
Converted 'data\edgar_documents\COP\4_2025-04-02' --> 'data\processed_data\COP\4_2025-04-02.md'


2025-11-14 16:05:12,301 - INFO - Going to convert document batch...
2025-11-14 16:05:12,305 - INFO - Processing document 4_2025-05-01
2025-11-14 16:05:12,376 - INFO - Finished converting document 4_2025-05-01 in 0.14 sec.
2025-11-14 16:05:12,464 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:12,466 - ERROR - Input document 4_2025-05-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:12,468 - INFO - Going to convert document batch...
2025-11-14 16:05:12,488 - IN

Converted 'data\edgar_documents\COP\4_2025-05-01' --> 'data\processed_data\COP\4_2025-05-01.md'
Error processing data\edgar_documents\COP\4_2025-05-16: File format not allowed: data\edgar_documents\COP\4_2025-05-16


2025-11-14 16:05:12,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,713 - INFO - Going to convert document batch...
2025-11-14 16:05:12,715 - INFO - Processing document 4_2025-06-17
2025-11-14 16:05:12,758 - INFO - Finished converting document 4_2025-06-17 in 0.09 sec.
2025-11-14 16:05:12,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,829 - INFO - Going to convert document batch...
2025-11-14 16:05:12,830 - INFO - Processing document 4_2025-07-02


Converted 'data\edgar_documents\COP\4_2025-06-02' --> 'data\processed_data\COP\4_2025-06-02.md'
Converted 'data\edgar_documents\COP\4_2025-06-17' --> 'data\processed_data\COP\4_2025-06-17.md'


2025-11-14 16:05:12,867 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 16:05:12,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,996 - INFO - Going to convert document batch...
2025-11-14 16:05:13,002 - INFO - Processing document 4_2025-08-04
2025-11-14 16:05:13,051 - INFO - Finished converting document 4_2025-08-04 in 0.12 sec.
2025-11-14 16:05:13,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-07-02' --> 'data\processed_data\COP\4_2025-07-02.md'
Converted 'data\edgar_documents\COP\4_2025-08-04' --> 'data\processed_data\COP\4_2025-08-04.md'


2025-11-14 16:05:13,131 - INFO - Going to convert document batch...
2025-11-14 16:05:13,132 - INFO - Processing document 4_2025-09-03
2025-11-14 16:05:13,169 - INFO - Finished converting document 4_2025-09-03 in 0.08 sec.
2025-11-14 16:05:13,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,239 - INFO - Going to convert document batch...
2025-11-14 16:05:13,242 - INFO - Processing document 4_2025-10-02
2025-11-14 16:05:13,317 - INFO - Finished converting document 4_2025-10-02 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2025-09-03' --> 'data\processed_data\COP\4_2025-09-03.md'
Converted 'data\edgar_documents\COP\4_2025-10-02' --> 'data\processed_data\COP\4_2025-10-02.md'


2025-11-14 16:05:13,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,415 - INFO - Going to convert document batch...
2025-11-14 16:05:13,416 - INFO - Processing document 4_2025-11-10
2025-11-14 16:05:13,457 - INFO - Finished converting document 4_2025-11-10 in 0.09 sec.
2025-11-14 16:05:13,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,574 - INFO - Going to convert document batch...
2025-11-14 16:05:13,576 - INFO - Processing document 8-K_2023-02-02
2025-11-14 16:05:13,622 - INFO - Finished converting document 8-K_2023-02-02 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2025-11-10' --> 'data\processed_data\COP\4_2025-11-10.md'
Converted 'data\edgar_documents\COP\8-K_2023-02-02' --> 'data\processed_data\COP\8-K_2023-02-02.md'


2025-11-14 16:05:13,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,724 - INFO - Going to convert document batch...
2025-11-14 16:05:13,727 - INFO - Processing document 8-K_2023-05-04
2025-11-14 16:05:13,791 - INFO - Finished converting document 8-K_2023-05-04 in 0.16 sec.
2025-11-14 16:05:13,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,915 - INFO - Going to convert document batch...
2025-11-14 16:05:13,917 - INFO - Processing document 8-K_2023-05-18


Converted 'data\edgar_documents\COP\8-K_2023-05-04' --> 'data\processed_data\COP\8-K_2023-05-04.md'


2025-11-14 16:05:14,094 - INFO - Finished converting document 8-K_2023-05-18 in 0.27 sec.
2025-11-14 16:05:14,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,325 - INFO - Going to convert document batch...
2025-11-14 16:05:14,326 - INFO - Processing document 8-K_2023-05-23
2025-11-14 16:05:14,362 - INFO - Finished converting document 8-K_2023-05-23 in 0.09 sec.
2025-11-14 16:05:14,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2023-05-18' --> 'data\processed_data\COP\8-K_2023-05-18.md'
Converted 'data\edgar_documents\COP\8-K_2023-05-23' --> 'data\processed_data\COP\8-K_2023-05-23.md'


2025-11-14 16:05:14,474 - INFO - Going to convert document batch...
2025-11-14 16:05:14,477 - INFO - Processing document 8-K_2023-08-03
2025-11-14 16:05:14,529 - INFO - Finished converting document 8-K_2023-08-03 in 0.14 sec.
2025-11-14 16:05:14,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,621 - INFO - Going to convert document batch...
2025-11-14 16:05:14,622 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:05:14,675 - INFO - Finished converting document 8-K_2023-08-17 in 0.12 sec.


Converted 'data\edgar_documents\COP\8-K_2023-08-03' --> 'data\processed_data\COP\8-K_2023-08-03.md'
Converted 'data\edgar_documents\COP\8-K_2023-08-17' --> 'data\processed_data\COP\8-K_2023-08-17.md'


2025-11-14 16:05:14,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,805 - INFO - Going to convert document batch...
2025-11-14 16:05:14,806 - INFO - Processing document 8-K_2023-11-02
2025-11-14 16:05:14,844 - INFO - Finished converting document 8-K_2023-11-02 in 0.12 sec.
2025-11-14 16:05:14,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,915 - INFO - Going to convert document batch...
2025-11-14 16:05:14,917 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:05:14,965 - INFO - Finished converting document 8-K_2024-02-08 in 0.09 sec.
2025-11-14 16:05:15,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2023-11-02' --> 'data\processed_data\COP\8-K_2023-11-02.md'
Converted 'data\edgar_documents\COP\8-K_2024-02-08' --> 'data\processed_data\COP\8-K_2024-02-08.md'


2025-11-14 16:05:15,072 - INFO - Going to convert document batch...
2025-11-14 16:05:15,076 - INFO - Processing document 8-K_2024-02-15
2025-11-14 16:05:15,138 - INFO - Finished converting document 8-K_2024-02-15 in 0.14 sec.
2025-11-14 16:05:15,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,219 - INFO - Going to convert document batch...
2025-11-14 16:05:15,223 - INFO - Processing document 8-K_2024-05-02
2025-11-14 16:05:15,272 - INFO - Finished converting document 8-K_2024-05-02 in 0.09 sec.
2025-11-14 16:05:15,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2024-02-15' --> 'data\processed_data\COP\8-K_2024-02-15.md'
Converted 'data\edgar_documents\COP\8-K_2024-05-02' --> 'data\processed_data\COP\8-K_2024-05-02.md'


2025-11-14 16:05:15,411 - INFO - Going to convert document batch...
2025-11-14 16:05:15,413 - INFO - Processing document 8-K_2024-05-16
2025-11-14 16:05:15,535 - INFO - Finished converting document 8-K_2024-05-16 in 0.23 sec.
2025-11-14 16:05:15,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,636 - INFO - Going to convert document batch...
2025-11-14 16:05:15,638 - INFO - Processing document 8-K_2024-05-29
2025-11-14 16:05:15,711 - INFO - Finished converting document 8-K_2024-05-29 in 0.12 sec.


Converted 'data\edgar_documents\COP\8-K_2024-05-16' --> 'data\processed_data\COP\8-K_2024-05-16.md'


2025-11-14 16:05:15,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,847 - INFO - Going to convert document batch...
2025-11-14 16:05:15,850 - INFO - Processing document 8-K_2024-07-02
2025-11-14 16:05:15,888 - INFO - Finished converting document 8-K_2024-07-02 in 0.09 sec.
2025-11-14 16:05:15,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,969 - INFO - Going to convert document batch...
2025-11-14 16:05:15,971 - INFO - Processing document 8-K_2024-07-12


Converted 'data\edgar_documents\COP\8-K_2024-05-29' --> 'data\processed_data\COP\8-K_2024-05-29.md'
Converted 'data\edgar_documents\COP\8-K_2024-07-02' --> 'data\processed_data\COP\8-K_2024-07-02.md'


2025-11-14 16:05:16,021 - INFO - Finished converting document 8-K_2024-07-12 in 0.11 sec.
2025-11-14 16:05:16,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,494 - INFO - Going to convert document batch...
2025-11-14 16:05:16,495 - INFO - Processing document 8-K_2024-08-01
2025-11-14 16:05:16,524 - INFO - Finished converting document 8-K_2024-08-01 in 0.06 sec.
2025-11-14 16:05:16,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,611 - INFO - Going to convert document batch...
2025-11-14 16:05:16,612 - INFO - Processing document 8-K_2024-09-03


Converted 'data\edgar_documents\COP\8-K_2024-07-12' --> 'data\processed_data\COP\8-K_2024-07-12.md'
Converted 'data\edgar_documents\COP\8-K_2024-08-01' --> 'data\processed_data\COP\8-K_2024-08-01.md'


2025-11-14 16:05:16,673 - INFO - Finished converting document 8-K_2024-09-03 in 0.14 sec.
2025-11-14 16:05:16,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,749 - INFO - Going to convert document batch...
2025-11-14 16:05:16,750 - INFO - Processing document 8-K_2024-10-31
2025-11-14 16:05:16,787 - INFO - Finished converting document 8-K_2024-10-31 in 0.06 sec.
2025-11-14 16:05:16,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2024-09-03' --> 'data\processed_data\COP\8-K_2024-09-03.md'
Converted 'data\edgar_documents\COP\8-K_2024-10-31' --> 'data\processed_data\COP\8-K_2024-10-31.md'


2025-11-14 16:05:16,912 - INFO - Going to convert document batch...
2025-11-14 16:05:16,914 - INFO - Processing document 8-K_2024-11-22
2025-11-14 16:05:17,066 - INFO - Finished converting document 8-K_2024-11-22 in 0.25 sec.
2025-11-14 16:05:17,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,202 - INFO - Going to convert document batch...
2025-11-14 16:05:17,203 - INFO - Processing document 8-K_2024-11-25
2025-11-14 16:05:17,271 - INFO - Finished converting document 8-K_2024-11-25 in 0.11 sec.


Converted 'data\edgar_documents\COP\8-K_2024-11-22' --> 'data\processed_data\COP\8-K_2024-11-22.md'
Converted 'data\edgar_documents\COP\8-K_2024-11-25' --> 'data\processed_data\COP\8-K_2024-11-25.md'


2025-11-14 16:05:17,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,387 - INFO - Going to convert document batch...
2025-11-14 16:05:17,389 - INFO - Processing document 8-K_2024-12-05
2025-11-14 16:05:17,485 - INFO - Finished converting document 8-K_2024-12-05 in 0.17 sec.
2025-11-14 16:05:17,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,625 - INFO - Going to convert document batch...
2025-11-14 16:05:17,627 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:05:17,696 - INFO - Finished converting document 8-K_2024-12-10 in 0.16 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-05' --> 'data\processed_data\COP\8-K_2024-12-05.md'


2025-11-14 16:05:17,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,828 - INFO - Going to convert document batch...
2025-11-14 16:05:17,830 - INFO - Processing document 8-K_2024-12-30
2025-11-14 16:05:17,891 - INFO - Finished converting document 8-K_2024-12-30 in 0.16 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-10' --> 'data\processed_data\COP\8-K_2024-12-10.md'


2025-11-14 16:05:17,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,002 - INFO - Going to convert document batch...
2025-11-14 16:05:18,002 - INFO - Processing document 8-K_2025-01-28
2025-11-14 16:05:18,048 - INFO - Finished converting document 8-K_2025-01-28 in 0.09 sec.
2025-11-14 16:05:18,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,129 - INFO - Going to convert document batch...
2025-11-14 16:05:18,130 - INFO - Processing document 8-K_2025-02-06
2025-11-14 16:05:18,154 - INFO - Finished converting document 8-K_2025-02-06 in 0.08 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-30' --> 'data\processed_data\COP\8-K_2024-12-30.md'
Converted 'data\edgar_documents\COP\8-K_2025-01-28' --> 'data\processed_data\COP\8-K_2025-01-28.md'


2025-11-14 16:05:18,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,199 - INFO - Going to convert document batch...
2025-11-14 16:05:18,201 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:05:18,232 - INFO - Finished converting document 8-K_2025-05-08 in 0.06 sec.
2025-11-14 16:05:18,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2025-02-06' --> 'data\processed_data\COP\8-K_2025-02-06.md'
Converted 'data\edgar_documents\COP\8-K_2025-05-08' --> 'data\processed_data\COP\8-K_2025-05-08.md'


2025-11-14 16:05:18,357 - INFO - Going to convert document batch...
2025-11-14 16:05:18,359 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:05:18,450 - INFO - Finished converting document 8-K_2025-05-15 in 0.20 sec.
2025-11-14 16:05:18,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,553 - INFO - Going to convert document batch...
2025-11-14 16:05:18,553 - INFO - Processing document 8-K_2025-07-01
2025-11-14 16:05:18,595 - INFO - Finished converting document 8-K_2025-07-01 in 0.09 sec.


Converted 'data\edgar_documents\COP\8-K_2025-05-15' --> 'data\processed_data\COP\8-K_2025-05-15.md'
Converted 'data\edgar_documents\COP\8-K_2025-07-01' --> 'data\processed_data\COP\8-K_2025-07-01.md'


2025-11-14 16:05:18,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,723 - INFO - Going to convert document batch...
2025-11-14 16:05:18,725 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:05:18,769 - INFO - Finished converting document 8-K_2025-08-07 in 0.11 sec.
2025-11-14 16:05:18,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,831 - INFO - Going to convert document batch...
2025-11-14 16:05:18,833 - INFO - Processing document 8-K_2025-11-06
2025-11-14 16:05:18,882 - INFO - Finished converting document 8-K_2025-11-06 in 0.09 sec.


Converted 'data\edgar_documents\COP\8-K_2025-08-07' --> 'data\processed_data\COP\8-K_2025-08-07.md'
Converted 'data\edgar_documents\COP\8-K_2025-11-06' --> 'data\processed_data\COP\8-K_2025-11-06.md'


2025-11-14 16:05:19,021 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:19,021 - ERROR - Input document DEF-14A_2023-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:19,025 - INFO - Going to convert document batch...
2025-11-14 16:05:19,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\COP\DEF-14A_2023-04-03: File format not allowed: data\edgar_documents\COP\DEF-14A_2023-04-03


2025-11-14 16:05:21,252 - INFO - Going to convert document batch...
2025-11-14 16:05:21,254 - INFO - Processing document DEF-14A_2024-04-01
2025-11-14 16:05:49,662 - INFO - Finished converting document DEF-14A_2024-04-01 in 30.62 sec.
2025-11-14 16:05:52,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\DEF-14A_2024-04-01' --> 'data\processed_data\COP\DEF-14A_2024-04-01.md'


2025-11-14 16:05:55,434 - INFO - Going to convert document batch...
2025-11-14 16:05:55,436 - INFO - Processing document DEF-14A_2025-03-31
2025-11-14 16:06:55,526 - INFO - Finished converting document DEF-14A_2025-03-31 in 63.11 sec.
2025-11-14 16:06:59,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\DEF-14A_2025-03-31' --> 'data\processed_data\COP\DEF-14A_2025-03-31.md'
Processed 112 new files. Errors: 12
Found 104 files to process in data\edgar_documents\COST


2025-11-14 16:07:00,365 - INFO - Going to convert document batch...
2025-11-14 16:07:00,366 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:07:00,368 - INFO - Processing document 10-K_2023-10-11
2025-11-14 16:07:02,295 - INFO - Finished converting document 10-K_2023-10-11 in 3.06 sec.
2025-11-14 16:07:03,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2023-10-11' --> 'data\processed_data\COST\10-K_2023-10-11.md'


2025-11-14 16:07:03,930 - INFO - Going to convert document batch...
2025-11-14 16:07:03,931 - INFO - Processing document 10-K_2024-10-09
2025-11-14 16:07:06,813 - INFO - Finished converting document 10-K_2024-10-09 in 3.70 sec.
2025-11-14 16:07:07,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2024-10-09' --> 'data\processed_data\COST\10-K_2024-10-09.md'


2025-11-14 16:07:08,554 - INFO - Going to convert document batch...
2025-11-14 16:07:08,557 - INFO - Processing document 10-K_2025-10-08
2025-11-14 16:07:10,380 - INFO - Finished converting document 10-K_2025-10-08 in 2.73 sec.
2025-11-14 16:07:11,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2025-10-08' --> 'data\processed_data\COST\10-K_2025-10-08.md'


2025-11-14 16:07:12,017 - INFO - Going to convert document batch...
2025-11-14 16:07:12,018 - INFO - Processing document 10-Q_2023-03-09
2025-11-14 16:07:13,017 - INFO - Finished converting document 10-Q_2023-03-09 in 1.72 sec.
2025-11-14 16:07:13,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-03-09' --> 'data\processed_data\COST\10-Q_2023-03-09.md'


2025-11-14 16:07:14,842 - INFO - Going to convert document batch...
2025-11-14 16:07:14,844 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:07:15,940 - INFO - Finished converting document 10-Q_2023-06-01 in 2.41 sec.
2025-11-14 16:07:16,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-06-01' --> 'data\processed_data\COST\10-Q_2023-06-01.md'


2025-11-14 16:07:16,856 - INFO - Going to convert document batch...
2025-11-14 16:07:16,858 - INFO - Processing document 10-Q_2023-12-20
2025-11-14 16:07:17,576 - INFO - Finished converting document 10-Q_2023-12-20 in 1.14 sec.
2025-11-14 16:07:17,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-12-20' --> 'data\processed_data\COST\10-Q_2023-12-20.md'


2025-11-14 16:07:18,420 - INFO - Going to convert document batch...
2025-11-14 16:07:18,421 - INFO - Processing document 10-Q_2024-03-13
2025-11-14 16:07:19,289 - INFO - Finished converting document 10-Q_2024-03-13 in 1.34 sec.
2025-11-14 16:07:19,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-03-13' --> 'data\processed_data\COST\10-Q_2024-03-13.md'


2025-11-14 16:07:20,788 - INFO - Going to convert document batch...
2025-11-14 16:07:20,790 - INFO - Processing document 10-Q_2024-06-06
2025-11-14 16:07:21,734 - INFO - Finished converting document 10-Q_2024-06-06 in 2.00 sec.
2025-11-14 16:07:22,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-06-06' --> 'data\processed_data\COST\10-Q_2024-06-06.md'


2025-11-14 16:07:22,875 - INFO - Going to convert document batch...
2025-11-14 16:07:22,877 - INFO - Processing document 10-Q_2024-12-19
2025-11-14 16:07:23,634 - INFO - Finished converting document 10-Q_2024-12-19 in 1.19 sec.
2025-11-14 16:07:24,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-12-19' --> 'data\processed_data\COST\10-Q_2024-12-19.md'


2025-11-14 16:07:24,617 - INFO - Going to convert document batch...
2025-11-14 16:07:24,618 - INFO - Processing document 10-Q_2025-03-13
2025-11-14 16:07:25,674 - INFO - Finished converting document 10-Q_2025-03-13 in 1.56 sec.
2025-11-14 16:07:26,309 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2025-03-13' --> 'data\processed_data\COST\10-Q_2025-03-13.md'


2025-11-14 16:07:27,233 - INFO - Going to convert document batch...
2025-11-14 16:07:27,235 - INFO - Processing document 10-Q_2025-06-05
2025-11-14 16:07:28,404 - INFO - Finished converting document 10-Q_2025-06-05 in 2.16 sec.
2025-11-14 16:07:28,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:28,971 - INFO - Going to convert document batch...
2025-11-14 16:07:28,975 - INFO - Processing document 4_2023-01-31
2025-11-14 16:07:29,014 - INFO - Finished converting document 4_2023-01-31 in 0.08 sec.
2025-11-14 16:07:29,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,144 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\10-Q_2025-06-05' --> 'data\processed_data\COST\10-Q_2025-06-05.md'
Converted 'data\edgar_documents\COST\4_2023-01-31' --> 'data\processed_data\COST\4_2023-01-31.md'


2025-11-14 16:07:29,146 - INFO - Processing document 4_2023-03-07
2025-11-14 16:07:29,201 - INFO - Finished converting document 4_2023-03-07 in 0.12 sec.
2025-11-14 16:07:29,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,275 - INFO - Going to convert document batch...
2025-11-14 16:07:29,277 - INFO - Processing document 4_2023-03-08
2025-11-14 16:07:29,343 - INFO - Finished converting document 4_2023-03-08 in 0.11 sec.
2025-11-14 16:07:29,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2023-03-07' --> 'data\processed_data\COST\4_2023-03-07.md'
Converted 'data\edgar_documents\COST\4_2023-03-08' --> 'data\processed_data\COST\4_2023-03-08.md'


2025-11-14 16:07:29,459 - INFO - Going to convert document batch...
2025-11-14 16:07:29,461 - INFO - Processing document 4_2023-03-15
2025-11-14 16:07:29,549 - INFO - Finished converting document 4_2023-03-15 in 0.14 sec.
2025-11-14 16:07:29,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,680 - INFO - Going to convert document batch...
2025-11-14 16:07:29,681 - INFO - Processing document 4_2023-04-13
2025-11-14 16:07:29,737 - INFO - Finished converting document 4_2023-04-13 in 0.12 sec.


Converted 'data\edgar_documents\COST\4_2023-03-15' --> 'data\processed_data\COST\4_2023-03-15.md'
Converted 'data\edgar_documents\COST\4_2023-04-13' --> 'data\processed_data\COST\4_2023-04-13.md'


2025-11-14 16:07:29,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,865 - INFO - Going to convert document batch...
2025-11-14 16:07:29,867 - INFO - Processing document 4_2023-06-09
2025-11-14 16:07:29,935 - INFO - Finished converting document 4_2023-06-09 in 0.14 sec.
2025-11-14 16:07:30,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,015 - INFO - Going to convert document batch...
2025-11-14 16:07:30,016 - INFO - Processing document 4_2023-06-15
2025-11-14 16:07:30,058 - INFO - Finished converting document 4_2023-06-15 in 0.08 sec.
2025-11-14 16:07:30,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,165 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2023-06-09' --> 'data\processed_data\COST\4_2023-06-09.md'
Converted 'data\edgar_documents\COST\4_2023-06-15' --> 'data\processed_data\COST\4_2023-06-15.md'


2025-11-14 16:07:30,167 - INFO - Processing document 4_2023-06-26
2025-11-14 16:07:30,208 - INFO - Finished converting document 4_2023-06-26 in 0.09 sec.
2025-11-14 16:07:30,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,289 - INFO - Going to convert document batch...
2025-11-14 16:07:30,292 - INFO - Processing document 4_2023-06-29
2025-11-14 16:07:30,325 - INFO - Finished converting document 4_2023-06-29 in 0.08 sec.
2025-11-14 16:07:30,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,421 - INFO - Going to convert document batch...
2025-11-14 16:07:30,423 - INFO - Processing document 4_2023-09-19


Converted 'data\edgar_documents\COST\4_2023-06-26' --> 'data\processed_data\COST\4_2023-06-26.md'
Converted 'data\edgar_documents\COST\4_2023-06-29' --> 'data\processed_data\COST\4_2023-06-29.md'


2025-11-14 16:07:30,470 - INFO - Finished converting document 4_2023-09-19 in 0.09 sec.
2025-11-14 16:07:30,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,580 - INFO - Going to convert document batch...
2025-11-14 16:07:30,582 - INFO - Processing document 4_2023-09-28
2025-11-14 16:07:30,618 - INFO - Finished converting document 4_2023-09-28 in 0.08 sec.
2025-11-14 16:07:30,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,706 - INFO - Going to convert document batch...
2025-11-14 16:07:30,708 - INFO - Processing document 4_2023-10-11


Converted 'data\edgar_documents\COST\4_2023-09-19' --> 'data\processed_data\COST\4_2023-09-19.md'
Converted 'data\edgar_documents\COST\4_2023-09-28' --> 'data\processed_data\COST\4_2023-09-28.md'


2025-11-14 16:07:30,784 - INFO - Finished converting document 4_2023-10-11 in 0.12 sec.
2025-11-14 16:07:30,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,890 - INFO - Going to convert document batch...
2025-11-14 16:07:30,891 - INFO - Processing document 4_2023-10-12
2025-11-14 16:07:30,931 - INFO - Finished converting document 4_2023-10-12 in 0.08 sec.
2025-11-14 16:07:31,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2023-10-11' --> 'data\processed_data\COST\4_2023-10-11.md'
Converted 'data\edgar_documents\COST\4_2023-10-12' --> 'data\processed_data\COST\4_2023-10-12.md'


2025-11-14 16:07:31,060 - INFO - Going to convert document batch...
2025-11-14 16:07:31,062 - INFO - Processing document 4_2023-10-24
2025-11-14 16:07:31,137 - INFO - Finished converting document 4_2023-10-24 in 0.16 sec.
2025-11-14 16:07:31,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,220 - INFO - Going to convert document batch...
2025-11-14 16:07:31,222 - INFO - Processing document 4_2023-11-06
2025-11-14 16:07:31,268 - INFO - Finished converting document 4_2023-11-06 in 0.09 sec.
2025-11-14 16:07:31,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,350 - INFO - Going to convert document batch...
2025-11-14 16:07:31,352 - INFO - Processing document 4_2023-11-08


Converted 'data\edgar_documents\COST\4_2023-10-24' --> 'data\processed_data\COST\4_2023-10-24.md'
Converted 'data\edgar_documents\COST\4_2023-11-06' --> 'data\processed_data\COST\4_2023-11-06.md'


2025-11-14 16:07:31,386 - INFO - Finished converting document 4_2023-11-08 in 0.08 sec.
2025-11-14 16:07:31,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,462 - INFO - Going to convert document batch...
2025-11-14 16:07:31,463 - INFO - Processing document 4_2023-11-13
2025-11-14 16:07:31,509 - INFO - Finished converting document 4_2023-11-13 in 0.08 sec.
2025-11-14 16:07:31,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,593 - INFO - Going to convert document batch...
2025-11-14 16:07:31,594 - INFO - Processing document 4_2023-12-20


Converted 'data\edgar_documents\COST\4_2023-11-08' --> 'data\processed_data\COST\4_2023-11-08.md'
Converted 'data\edgar_documents\COST\4_2023-11-13' --> 'data\processed_data\COST\4_2023-11-13.md'


2025-11-14 16:07:31,665 - INFO - Finished converting document 4_2023-12-20 in 0.11 sec.
2025-11-14 16:07:31,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,769 - INFO - Going to convert document batch...
2025-11-14 16:07:31,770 - INFO - Processing document 4_2023-12-28
2025-11-14 16:07:31,811 - INFO - Finished converting document 4_2023-12-28 in 0.09 sec.
2025-11-14 16:07:31,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,890 - INFO - Going to convert document batch...
2025-11-14 16:07:31,892 - INFO - Processing document 4_2024-01-02


Converted 'data\edgar_documents\COST\4_2023-12-20' --> 'data\processed_data\COST\4_2023-12-20.md'
Converted 'data\edgar_documents\COST\4_2023-12-28' --> 'data\processed_data\COST\4_2023-12-28.md'


2025-11-14 16:07:31,932 - INFO - Finished converting document 4_2024-01-02 in 0.09 sec.
2025-11-14 16:07:32,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,025 - INFO - Going to convert document batch...
2025-11-14 16:07:32,026 - INFO - Processing document 4_2024-01-10
2025-11-14 16:07:32,068 - INFO - Finished converting document 4_2024-01-10 in 0.08 sec.
2025-11-14 16:07:32,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,147 - INFO - Going to convert document batch...
2025-11-14 16:07:32,149 - INFO - Processing document 4_2024-01-12
2025-11-14 16:07:32,187 - INFO - Finished converting document 4_2024-01-12 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2024-01-02' --> 'data\processed_data\COST\4_2024-01-02.md'
Converted 'data\edgar_documents\COST\4_2024-01-10' --> 'data\processed_data\COST\4_2024-01-10.md'


2025-11-14 16:07:32,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,249 - INFO - Going to convert document batch...
2025-11-14 16:07:32,250 - INFO - Processing document 4_2024-01-16
2025-11-14 16:07:32,289 - INFO - Finished converting document 4_2024-01-16 in 0.06 sec.
2025-11-14 16:07:32,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,362 - INFO - Going to convert document batch...
2025-11-14 16:07:32,364 - INFO - Processing document 4_2024-01-18
2025-11-14 16:07:32,398 - INFO - Finished converting document 4_2024-01-18 in 0.06 sec.


Converted 'data\edgar_documents\COST\4_2024-01-12' --> 'data\processed_data\COST\4_2024-01-12.md'
Converted 'data\edgar_documents\COST\4_2024-01-16' --> 'data\processed_data\COST\4_2024-01-16.md'


2025-11-14 16:07:32,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,475 - INFO - Going to convert document batch...
2025-11-14 16:07:32,477 - INFO - Processing document 4_2024-01-23
2025-11-14 16:07:32,536 - INFO - Finished converting document 4_2024-01-23 in 0.11 sec.
2025-11-14 16:07:32,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2024-01-18' --> 'data\processed_data\COST\4_2024-01-18.md'
Converted 'data\edgar_documents\COST\4_2024-01-23' --> 'data\processed_data\COST\4_2024-01-23.md'


2025-11-14 16:07:32,617 - INFO - Going to convert document batch...
2025-11-14 16:07:32,618 - INFO - Processing document 4_2024-02-12
2025-11-14 16:07:32,652 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.
2025-11-14 16:07:32,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,720 - INFO - Going to convert document batch...
2025-11-14 16:07:32,721 - INFO - Processing document 4_2024-02-22
2025-11-14 16:07:32,772 - INFO - Finished converting document 4_2024-02-22 in 0.08 sec.
2025-11-14 16:07:32,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,844 - INFO - Going to convert document batch...
2025-11-14 16:07:32,845 - INFO - Processing document 4_2024-03-13


Converted 'data\edgar_documents\COST\4_2024-02-12' --> 'data\processed_data\COST\4_2024-02-12.md'
Converted 'data\edgar_documents\COST\4_2024-02-22' --> 'data\processed_data\COST\4_2024-02-22.md'


2025-11-14 16:07:32,879 - INFO - Finished converting document 4_2024-03-13 in 0.06 sec.
2025-11-14 16:07:32,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,969 - INFO - Going to convert document batch...
2025-11-14 16:07:32,971 - INFO - Processing document 4_2024-04-09
2025-11-14 16:07:33,037 - INFO - Finished converting document 4_2024-04-09 in 0.11 sec.


Converted 'data\edgar_documents\COST\4_2024-03-13' --> 'data\processed_data\COST\4_2024-03-13.md'
Converted 'data\edgar_documents\COST\4_2024-04-09' --> 'data\processed_data\COST\4_2024-04-09.md'


2025-11-14 16:07:33,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,133 - INFO - Going to convert document batch...
2025-11-14 16:07:33,135 - INFO - Processing document 4_2024-04-18
2025-11-14 16:07:33,177 - INFO - Finished converting document 4_2024-04-18 in 0.09 sec.
2025-11-14 16:07:33,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,241 - INFO - Going to convert document batch...
2025-11-14 16:07:33,242 - INFO - Processing document 4_2024-07-15
2025-11-14 16:07:33,297 - INFO - Finished converting document 4_2024-07-15 in 0.09 sec.


Converted 'data\edgar_documents\COST\4_2024-04-18' --> 'data\processed_data\COST\4_2024-04-18.md'
Converted 'data\edgar_documents\COST\4_2024-07-15' --> 'data\processed_data\COST\4_2024-07-15.md'


2025-11-14 16:07:33,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,421 - INFO - Going to convert document batch...
2025-11-14 16:07:33,425 - INFO - Processing document 4_2024-07-17
2025-11-14 16:07:33,474 - INFO - Finished converting document 4_2024-07-17 in 0.09 sec.
2025-11-14 16:07:33,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,569 - INFO - Going to convert document batch...
2025-11-14 16:07:33,570 - INFO - Processing document 4_2024-07-22
2025-11-14 16:07:33,618 - INFO - Finished converting document 4_2024-07-22 in 0.08 sec.
2025-11-14 16:07:33,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,725 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2024-07-17' --> 'data\processed_data\COST\4_2024-07-17.md'
Converted 'data\edgar_documents\COST\4_2024-07-22' --> 'data\processed_data\COST\4_2024-07-22.md'


2025-11-14 16:07:33,727 - INFO - Processing document 4_2024-08-15
2025-11-14 16:07:33,781 - INFO - Finished converting document 4_2024-08-15 in 0.12 sec.
2025-11-14 16:07:33,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,852 - INFO - Going to convert document batch...
2025-11-14 16:07:33,854 - INFO - Processing document 4_2024-08-29
2025-11-14 16:07:33,891 - INFO - Finished converting document 4_2024-08-29 in 0.06 sec.
2025-11-14 16:07:33,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,958 - INFO - Going to convert document batch...
2025-11-14 16:07:33,959 - INFO - Processing document 4_2024-09-18
2025-11-14 16:07:34,001 - INFO - Finished converting document 4_2024-09-18 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2024-08-15' --> 'data\processed_data\COST\4_2024-08-15.md'
Converted 'data\edgar_documents\COST\4_2024-08-29' --> 'data\processed_data\COST\4_2024-08-29.md'


2025-11-14 16:07:34,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,084 - INFO - Going to convert document batch...
2025-11-14 16:07:34,086 - INFO - Processing document 4_2024-09-26
2025-11-14 16:07:34,125 - INFO - Finished converting document 4_2024-09-26 in 0.08 sec.
2025-11-14 16:07:34,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,207 - INFO - Going to convert document batch...
2025-11-14 16:07:34,208 - INFO - Processing document 4_2024-10-02


Converted 'data\edgar_documents\COST\4_2024-09-18' --> 'data\processed_data\COST\4_2024-09-18.md'
Converted 'data\edgar_documents\COST\4_2024-09-26' --> 'data\processed_data\COST\4_2024-09-26.md'


2025-11-14 16:07:34,245 - INFO - Finished converting document 4_2024-10-02 in 0.09 sec.
2025-11-14 16:07:34,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,309 - INFO - Going to convert document batch...
2025-11-14 16:07:34,310 - INFO - Processing document 4_2024-10-15
2025-11-14 16:07:34,343 - INFO - Finished converting document 4_2024-10-15 in 0.06 sec.
2025-11-14 16:07:34,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,421 - INFO - Going to convert document batch...
2025-11-14 16:07:34,423 - INFO - Processing document 4_2024-10-24


Converted 'data\edgar_documents\COST\4_2024-10-02' --> 'data\processed_data\COST\4_2024-10-02.md'
Converted 'data\edgar_documents\COST\4_2024-10-15' --> 'data\processed_data\COST\4_2024-10-15.md'


2025-11-14 16:07:34,478 - INFO - Finished converting document 4_2024-10-24 in 0.09 sec.
2025-11-14 16:07:34,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,576 - INFO - Going to convert document batch...
2025-11-14 16:07:34,579 - INFO - Processing document 4_2024-12-18
2025-11-14 16:07:34,618 - INFO - Finished converting document 4_2024-12-18 in 0.09 sec.
2025-11-14 16:07:34,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,704 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2024-10-24' --> 'data\processed_data\COST\4_2024-10-24.md'
Converted 'data\edgar_documents\COST\4_2024-12-18' --> 'data\processed_data\COST\4_2024-12-18.md'


2025-11-14 16:07:34,705 - INFO - Processing document 4_2024-12-23
2025-11-14 16:07:34,773 - INFO - Finished converting document 4_2024-12-23 in 0.11 sec.
2025-11-14 16:07:34,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,856 - INFO - Going to convert document batch...
2025-11-14 16:07:34,858 - INFO - Processing document 4_2025-03-13
2025-11-14 16:07:34,944 - INFO - Finished converting document 4_2025-03-13 in 0.12 sec.


Converted 'data\edgar_documents\COST\4_2024-12-23' --> 'data\processed_data\COST\4_2024-12-23.md'
Converted 'data\edgar_documents\COST\4_2025-03-13' --> 'data\processed_data\COST\4_2025-03-13.md'


2025-11-14 16:07:35,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,065 - INFO - Going to convert document batch...
2025-11-14 16:07:35,069 - INFO - Processing document 4_2025-03-20
2025-11-14 16:07:35,129 - INFO - Finished converting document 4_2025-03-20 in 0.12 sec.
2025-11-14 16:07:35,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,233 - INFO - Going to convert document batch...
2025-11-14 16:07:35,235 - INFO - Processing document 4_2025-03-25
2025-11-14 16:07:35,300 - INFO - Finished converting document 4_2025-03-25 in 0.11 sec.
2025-11-14 16:07:35,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-03-20' --> 'data\processed_data\COST\4_2025-03-20.md'
Converted 'data\edgar_documents\COST\4_2025-03-25' --> 'data\processed_data\COST\4_2025-03-25.md'


2025-11-14 16:07:35,404 - INFO - Going to convert document batch...
2025-11-14 16:07:35,406 - INFO - Processing document 4_2025-03-27
2025-11-14 16:07:35,453 - INFO - Finished converting document 4_2025-03-27 in 0.11 sec.
2025-11-14 16:07:35,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,525 - INFO - Going to convert document batch...
2025-11-14 16:07:35,526 - INFO - Processing document 4_2025-04-21
2025-11-14 16:07:35,562 - INFO - Finished converting document 4_2025-04-21 in 0.08 sec.
2025-11-14 16:07:35,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,646 - INFO - Going to convert document batch...
2025-11-14 16:07:35,649 - INFO - Processing document 4_2025-06-09
2025-11-14 16:07:35,709 - INFO - Finished converting document 4_2025-06-09 in 0.11 sec.


Converted 'data\edgar_documents\COST\4_2025-03-27' --> 'data\processed_data\COST\4_2025-03-27.md'
Converted 'data\edgar_documents\COST\4_2025-04-21' --> 'data\processed_data\COST\4_2025-04-21.md'


2025-11-14 16:07:35,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,822 - INFO - Going to convert document batch...
2025-11-14 16:07:35,824 - INFO - Processing document 4_2025-06-10
2025-11-14 16:07:35,861 - INFO - Finished converting document 4_2025-06-10 in 0.08 sec.
2025-11-14 16:07:35,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,947 - INFO - Going to convert document batch...
2025-11-14 16:07:35,948 - INFO - Processing document 4_2025-06-20


Converted 'data\edgar_documents\COST\4_2025-06-09' --> 'data\processed_data\COST\4_2025-06-09.md'
Converted 'data\edgar_documents\COST\4_2025-06-10' --> 'data\processed_data\COST\4_2025-06-10.md'


2025-11-14 16:07:36,041 - INFO - Finished converting document 4_2025-06-20 in 0.14 sec.
2025-11-14 16:07:36,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,125 - INFO - Going to convert document batch...
2025-11-14 16:07:36,126 - INFO - Processing document 4_2025-07-15
2025-11-14 16:07:36,184 - INFO - Finished converting document 4_2025-07-15 in 0.11 sec.
2025-11-14 16:07:36,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-06-20' --> 'data\processed_data\COST\4_2025-06-20.md'
Converted 'data\edgar_documents\COST\4_2025-07-15' --> 'data\processed_data\COST\4_2025-07-15.md'


2025-11-14 16:07:36,310 - INFO - Going to convert document batch...
2025-11-14 16:07:36,311 - INFO - Processing document 4_2025-08-22
2025-11-14 16:07:36,361 - INFO - Finished converting document 4_2025-08-22 in 0.11 sec.
2025-11-14 16:07:36,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,455 - INFO - Going to convert document batch...
2025-11-14 16:07:36,457 - INFO - Processing document 4_2025-09-04
2025-11-14 16:07:36,491 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 16:07:36,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,576 - INFO - Going to convert document batch...
2025-11-14 16:07:36,578 - INFO - Processing document 4_2025-09-12
2025-11-14 16:07:36,616 - INFO - Finished converting document 4_2025-09-12 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2025-08-22' --> 'data\processed_data\COST\4_2025-08-22.md'
Converted 'data\edgar_documents\COST\4_2025-09-04' --> 'data\processed_data\COST\4_2025-09-04.md'


2025-11-14 16:07:36,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,729 - INFO - Going to convert document batch...
2025-11-14 16:07:36,732 - INFO - Processing document 4_2025-09-24
2025-11-14 16:07:36,784 - INFO - Finished converting document 4_2025-09-24 in 0.09 sec.


Converted 'data\edgar_documents\COST\4_2025-09-12' --> 'data\processed_data\COST\4_2025-09-12.md'
Converted 'data\edgar_documents\COST\4_2025-09-24' --> 'data\processed_data\COST\4_2025-09-24.md'


2025-11-14 16:07:36,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,882 - INFO - Going to convert document batch...
2025-11-14 16:07:36,884 - INFO - Processing document 4_2025-09-30
2025-11-14 16:07:36,944 - INFO - Finished converting document 4_2025-09-30 in 0.11 sec.
2025-11-14 16:07:36,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-09-30' --> 'data\processed_data\COST\4_2025-09-30.md'


2025-11-14 16:07:37,754 - INFO - Going to convert document batch...
2025-11-14 16:07:37,756 - INFO - Processing document 4_2025-10-01
2025-11-14 16:07:37,803 - INFO - Finished converting document 4_2025-10-01 in 0.81 sec.
2025-11-14 16:07:37,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:37,977 - INFO - Going to convert document batch...
2025-11-14 16:07:37,978 - INFO - Processing document 4_2025-10-24
2025-11-14 16:07:38,014 - INFO - Finished converting document 4_2025-10-24 in 0.08 sec.
2025-11-14 16:07:38,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-10-01' --> 'data\processed_data\COST\4_2025-10-01.md'
Converted 'data\edgar_documents\COST\4_2025-10-24' --> 'data\processed_data\COST\4_2025-10-24.md'


2025-11-14 16:07:38,149 - INFO - Going to convert document batch...
2025-11-14 16:07:38,151 - INFO - Processing document 8-K_2023-01-19
2025-11-14 16:07:38,210 - INFO - Finished converting document 8-K_2023-01-19 in 0.12 sec.
2025-11-14 16:07:38,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,316 - INFO - Going to convert document batch...
2025-11-14 16:07:38,317 - INFO - Processing document 8-K_2023-01-25
2025-11-14 16:07:38,384 - INFO - Finished converting document 8-K_2023-01-25 in 0.14 sec.


Converted 'data\edgar_documents\COST\8-K_2023-01-19' --> 'data\processed_data\COST\8-K_2023-01-19.md'


2025-11-14 16:07:38,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,496 - INFO - Going to convert document batch...
2025-11-14 16:07:38,498 - INFO - Processing document 8-K_2023-03-03
2025-11-14 16:07:38,535 - INFO - Finished converting document 8-K_2023-03-03 in 0.11 sec.
2025-11-14 16:07:38,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,591 - INFO - Going to convert document batch...
2025-11-14 16:07:38,592 - INFO - Processing document 8-K_2023-04-19


Converted 'data\edgar_documents\COST\8-K_2023-01-25' --> 'data\processed_data\COST\8-K_2023-01-25.md'
Converted 'data\edgar_documents\COST\8-K_2023-03-03' --> 'data\processed_data\COST\8-K_2023-03-03.md'


2025-11-14 16:07:38,634 - INFO - Finished converting document 8-K_2023-04-19 in 0.08 sec.
2025-11-14 16:07:38,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,731 - INFO - Going to convert document batch...
2025-11-14 16:07:38,733 - INFO - Processing document 8-K_2023-05-25
2025-11-14 16:07:38,772 - INFO - Finished converting document 8-K_2023-05-25 in 0.11 sec.
2025-11-14 16:07:38,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2023-04-19' --> 'data\processed_data\COST\8-K_2023-04-19.md'
Converted 'data\edgar_documents\COST\8-K_2023-05-25' --> 'data\processed_data\COST\8-K_2023-05-25.md'


2025-11-14 16:07:38,883 - INFO - Going to convert document batch...
2025-11-14 16:07:38,885 - INFO - Processing document 8-K_2023-08-10
2025-11-14 16:07:38,962 - INFO - Finished converting document 8-K_2023-08-10 in 0.16 sec.
2025-11-14 16:07:39,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,064 - INFO - Going to convert document batch...
2025-11-14 16:07:39,065 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:07:39,101 - INFO - Finished converting document 8-K_2023-08-17 in 0.09 sec.
2025-11-14 16:07:39,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2023-08-10' --> 'data\processed_data\COST\8-K_2023-08-10.md'
Converted 'data\edgar_documents\COST\8-K_2023-08-17' --> 'data\processed_data\COST\8-K_2023-08-17.md'


2025-11-14 16:07:39,200 - INFO - Going to convert document batch...
2025-11-14 16:07:39,205 - INFO - Processing document 8-K_2023-09-26
2025-11-14 16:07:39,265 - INFO - Finished converting document 8-K_2023-09-26 in 0.14 sec.
2025-11-14 16:07:39,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,335 - INFO - Going to convert document batch...
2025-11-14 16:07:39,337 - INFO - Processing document 8-K_2023-10-20
2025-11-14 16:07:39,365 - INFO - Finished converting document 8-K_2023-10-20 in 0.08 sec.
2025-11-14 16:07:39,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,428 - INFO - Going to convert document batch...
2025-11-14 16:07:39,430 - INFO - Processing document 8-K_2023-11-24
2025-11-14 16:07:39,459 - INFO - Finished converting document 8-K_2023-11-24 in 0.08 sec.


Converted 'data\edgar_documents\COST\8-K_2023-09-26' --> 'data\processed_data\COST\8-K_2023-09-26.md'
Converted 'data\edgar_documents\COST\8-K_2023-10-20' --> 'data\processed_data\COST\8-K_2023-10-20.md'


2025-11-14 16:07:39,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,543 - INFO - Going to convert document batch...
2025-11-14 16:07:39,545 - INFO - Processing document 8-K_2023-12-14
2025-11-14 16:07:39,582 - INFO - Finished converting document 8-K_2023-12-14 in 0.11 sec.
2025-11-14 16:07:39,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,647 - INFO - Going to convert document batch...
2025-11-14 16:07:39,648 - INFO - Processing document 8-K_2024-01-22


Converted 'data\edgar_documents\COST\8-K_2023-11-24' --> 'data\processed_data\COST\8-K_2023-11-24.md'
Converted 'data\edgar_documents\COST\8-K_2023-12-14' --> 'data\processed_data\COST\8-K_2023-12-14.md'


2025-11-14 16:07:39,675 - INFO - Finished converting document 8-K_2024-01-22 in 0.08 sec.
2025-11-14 16:07:39,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,734 - INFO - Going to convert document batch...
2025-11-14 16:07:39,735 - INFO - Processing document 8-K_2024-02-09
2025-11-14 16:07:39,784 - INFO - Finished converting document 8-K_2024-02-09 in 0.09 sec.
2025-11-14 16:07:39,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,857 - INFO - Going to convert document batch...
2025-11-14 16:07:39,859 - INFO - Processing document 8-K_2024-03-07


Converted 'data\edgar_documents\COST\8-K_2024-01-22' --> 'data\processed_data\COST\8-K_2024-01-22.md'
Converted 'data\edgar_documents\COST\8-K_2024-02-09' --> 'data\processed_data\COST\8-K_2024-02-09.md'


2025-11-14 16:07:39,898 - INFO - Finished converting document 8-K_2024-03-07 in 0.09 sec.
2025-11-14 16:07:39,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,964 - INFO - Going to convert document batch...
2025-11-14 16:07:39,966 - INFO - Processing document 8-K_2024-04-10
2025-11-14 16:07:39,992 - INFO - Finished converting document 8-K_2024-04-10 in 0.05 sec.
2025-11-14 16:07:40,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,081 - INFO - Going to convert document batch...
2025-11-14 16:07:40,083 - INFO - Processing document 8-K_2024-05-30
2025-11-14 16:07:40,116 - INFO - Finished converting document 8-K_2024-05-30 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2024-03-07' --> 'data\processed_data\COST\8-K_2024-03-07.md'
Converted 'data\edgar_documents\COST\8-K_2024-04-10' --> 'data\processed_data\COST\8-K_2024-04-10.md'
Converted 'data\edgar_documents\COST\8-K_2024-05-30' --> 'data\processed_data\COST\8-K_2024-05-30.md'


2025-11-14 16:07:40,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,187 - INFO - Going to convert document batch...
2025-11-14 16:07:40,189 - INFO - Processing document 8-K_2024-07-10
2025-11-14 16:07:40,219 - INFO - Finished converting document 8-K_2024-07-10 in 0.09 sec.
2025-11-14 16:07:40,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,307 - INFO - Going to convert document batch...
2025-11-14 16:07:40,309 - INFO - Processing document 8-K_2024-09-20
2025-11-14 16:07:40,352 - INFO - Finished converting document 8-K_2024-09-20 in 0.09 sec.
2025-11-14 16:07:40,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2024-07-10' --> 'data\processed_data\COST\8-K_2024-07-10.md'
Converted 'data\edgar_documents\COST\8-K_2024-09-20' --> 'data\processed_data\COST\8-K_2024-09-20.md'


2025-11-14 16:07:40,432 - INFO - Going to convert document batch...
2025-11-14 16:07:40,436 - INFO - Processing document 8-K_2024-09-26
2025-11-14 16:07:40,482 - INFO - Finished converting document 8-K_2024-09-26 in 0.11 sec.
2025-11-14 16:07:40,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,532 - INFO - Going to convert document batch...
2025-11-14 16:07:40,533 - INFO - Processing document 8-K_2024-10-17
2025-11-14 16:07:40,561 - INFO - Finished converting document 8-K_2024-10-17 in 0.06 sec.
2025-11-14 16:07:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,614 - INFO - Going to convert document batch...
2025-11-14 16:07:40,616 - INFO - Processing document 8-K_2024-11-07
2025-11-14 16:07:40,677 - INFO - Finished converting document 8-K_2024-11-07 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2024-09-26' --> 'data\processed_data\COST\8-K_2024-09-26.md'
Converted 'data\edgar_documents\COST\8-K_2024-10-17' --> 'data\processed_data\COST\8-K_2024-10-17.md'
Converted 'data\edgar_documents\COST\8-K_2024-11-07' --> 'data\processed_data\COST\8-K_2024-11-07.md'


2025-11-14 16:07:40,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,766 - INFO - Going to convert document batch...
2025-11-14 16:07:40,770 - INFO - Processing document 8-K_2024-12-12
2025-11-14 16:07:40,895 - INFO - Finished converting document 8-K_2024-12-12 in 0.20 sec.
2025-11-14 16:07:40,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,007 - INFO - Going to convert document batch...
2025-11-14 16:07:41,009 - INFO - Processing document 8-K_2025-01-27
2025-11-14 16:07:41,096 - INFO - Finished converting document 8-K_2025-01-27 in 0.17 sec.


Converted 'data\edgar_documents\COST\8-K_2024-12-12' --> 'data\processed_data\COST\8-K_2024-12-12.md'
Converted 'data\edgar_documents\COST\8-K_2025-01-27' --> 'data\processed_data\COST\8-K_2025-01-27.md'


2025-11-14 16:07:41,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,183 - INFO - Going to convert document batch...
2025-11-14 16:07:41,184 - INFO - Processing document 8-K_2025-02-03
2025-11-14 16:07:41,232 - INFO - Finished converting document 8-K_2025-02-03 in 0.09 sec.
2025-11-14 16:07:41,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,310 - INFO - Going to convert document batch...
2025-11-14 16:07:41,312 - INFO - Processing document 8-K_2025-03-06
2025-11-14 16:07:41,360 - INFO - Finished converting document 8-K_2025-03-06 in 0.09 sec.
2025-11-14 16:07:41,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2025-02-03' --> 'data\processed_data\COST\8-K_2025-02-03.md'
Converted 'data\edgar_documents\COST\8-K_2025-03-06' --> 'data\processed_data\COST\8-K_2025-03-06.md'


2025-11-14 16:07:41,449 - INFO - Going to convert document batch...
2025-11-14 16:07:41,452 - INFO - Processing document 8-K_2025-04-16
2025-11-14 16:07:41,482 - INFO - Finished converting document 8-K_2025-04-16 in 0.09 sec.
2025-11-14 16:07:41,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,529 - INFO - Going to convert document batch...
2025-11-14 16:07:41,530 - INFO - Processing document 8-K_2025-05-29
2025-11-14 16:07:41,561 - INFO - Finished converting document 8-K_2025-05-29 in 0.06 sec.
2025-11-14 16:07:41,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,618 - INFO - Going to convert document batch...
2025-11-14 16:07:41,619 - INFO - Processing document 8-K_2025-06-11
2025-11-14 16:07:41,671 - INFO - Finished converting document 8-K_2025-06-11 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2025-04-16' --> 'data\processed_data\COST\8-K_2025-04-16.md'
Converted 'data\edgar_documents\COST\8-K_2025-05-29' --> 'data\processed_data\COST\8-K_2025-05-29.md'
Converted 'data\edgar_documents\COST\8-K_2025-06-11' --> 'data\processed_data\COST\8-K_2025-06-11.md'


2025-11-14 16:07:41,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,765 - INFO - Going to convert document batch...
2025-11-14 16:07:41,767 - INFO - Processing document 8-K_2025-07-16
2025-11-14 16:07:41,798 - INFO - Finished converting document 8-K_2025-07-16 in 0.09 sec.
2025-11-14 16:07:41,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,859 - INFO - Going to convert document batch...
2025-11-14 16:07:41,861 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:07:41,905 - INFO - Finished converting document 8-K_2025-08-07 in 0.09 sec.
2025-11-14 16:07:41,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,980 - INFO - Going to convert document batch...
2025-11-14 16:07:41,982 - INFO - Processing document 8-K_2025-09-25


Converted 'data\edgar_documents\COST\8-K_2025-07-16' --> 'data\processed_data\COST\8-K_2025-07-16.md'
Converted 'data\edgar_documents\COST\8-K_2025-08-07' --> 'data\processed_data\COST\8-K_2025-08-07.md'


2025-11-14 16:07:42,033 - INFO - Finished converting document 8-K_2025-09-25 in 0.09 sec.
2025-11-14 16:07:42,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,087 - INFO - Going to convert document batch...
2025-11-14 16:07:42,089 - INFO - Processing document 8-K_2025-10-15
2025-11-14 16:07:42,117 - INFO - Finished converting document 8-K_2025-10-15 in 0.06 sec.
2025-11-14 16:07:42,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,169 - INFO - Going to convert document batch...
2025-11-14 16:07:42,171 - INFO - Processing document 8-K_2025-10-20
2025-11-14 16:07:42,200 - INFO - Finished converting document 8-K_2025-10-20 in 0.06 sec.


Converted 'data\edgar_documents\COST\8-K_2025-09-25' --> 'data\processed_data\COST\8-K_2025-09-25.md'
Converted 'data\edgar_documents\COST\8-K_2025-10-15' --> 'data\processed_data\COST\8-K_2025-10-15.md'
Converted 'data\edgar_documents\COST\8-K_2025-10-20' --> 'data\processed_data\COST\8-K_2025-10-20.md'


2025-11-14 16:07:42,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,610 - INFO - Going to convert document batch...
2025-11-14 16:07:42,611 - INFO - Processing document DEF-14A_2023-12-07
2025-11-14 16:07:43,360 - INFO - Finished converting document DEF-14A_2023-12-07 in 1.14 sec.
2025-11-14 16:07:43,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\DEF-14A_2023-12-07' --> 'data\processed_data\COST\DEF-14A_2023-12-07.md'


2025-11-14 16:07:44,106 - INFO - Going to convert document batch...
2025-11-14 16:07:44,108 - INFO - Processing document DEF-14A_2024-12-11
2025-11-14 16:07:44,705 - INFO - Finished converting document DEF-14A_2024-12-11 in 1.02 sec.
2025-11-14 16:07:45,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\DEF-14A_2024-12-11' --> 'data\processed_data\COST\DEF-14A_2024-12-11.md'
Processed 104 new files. Errors: 0
Found 511 files to process in data\edgar_documents\CRM


2025-11-14 16:07:47,260 - INFO - Going to convert document batch...
2025-11-14 16:07:47,262 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:07:47,264 - INFO - Processing document 10-K_2023-03-08
2025-11-14 16:07:50,017 - INFO - Finished converting document 10-K_2023-03-08 in 4.98 sec.
2025-11-14 16:07:51,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2023-03-08' --> 'data\processed_data\CRM\10-K_2023-03-08.md'


2025-11-14 16:07:53,370 - INFO - Going to convert document batch...
2025-11-14 16:07:53,372 - INFO - Processing document 10-K_2024-03-06
2025-11-14 16:07:56,385 - INFO - Finished converting document 10-K_2024-03-06 in 5.06 sec.
2025-11-14 16:07:57,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2024-03-06' --> 'data\processed_data\CRM\10-K_2024-03-06.md'


2025-11-14 16:07:59,177 - INFO - Going to convert document batch...
2025-11-14 16:07:59,178 - INFO - Processing document 10-K_2025-03-05
2025-11-14 16:08:00,341 - INFO - Finished converting document 10-K_2025-03-05 in 2.53 sec.
2025-11-14 16:08:00,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2025-03-05' --> 'data\processed_data\CRM\10-K_2025-03-05.md'


2025-11-14 16:08:01,220 - INFO - Going to convert document batch...
2025-11-14 16:08:01,221 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:08:01,932 - INFO - Finished converting document 10-Q_2023-06-01 in 1.11 sec.
2025-11-14 16:08:02,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-06-01' --> 'data\processed_data\CRM\10-Q_2023-06-01.md'


2025-11-14 16:08:03,105 - INFO - Going to convert document batch...
2025-11-14 16:08:03,106 - INFO - Processing document 10-Q_2023-08-31
2025-11-14 16:08:03,930 - INFO - Finished converting document 10-Q_2023-08-31 in 1.28 sec.
2025-11-14 16:08:04,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-08-31' --> 'data\processed_data\CRM\10-Q_2023-08-31.md'


2025-11-14 16:08:05,154 - INFO - Going to convert document batch...
2025-11-14 16:08:05,155 - INFO - Processing document 10-Q_2023-11-30
2025-11-14 16:08:06,128 - INFO - Finished converting document 10-Q_2023-11-30 in 1.72 sec.
2025-11-14 16:08:06,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-11-30' --> 'data\processed_data\CRM\10-Q_2023-11-30.md'


2025-11-14 16:08:07,399 - INFO - Going to convert document batch...
2025-11-14 16:08:07,400 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 16:08:08,233 - INFO - Finished converting document 10-Q_2024-05-30 in 1.62 sec.
2025-11-14 16:08:08,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-05-30' --> 'data\processed_data\CRM\10-Q_2024-05-30.md'


2025-11-14 16:08:09,296 - INFO - Going to convert document batch...
2025-11-14 16:08:09,298 - INFO - Processing document 10-Q_2024-08-29
2025-11-14 16:08:10,440 - INFO - Finished converting document 10-Q_2024-08-29 in 1.75 sec.
2025-11-14 16:08:11,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-08-29' --> 'data\processed_data\CRM\10-Q_2024-08-29.md'


2025-11-14 16:08:11,828 - INFO - Going to convert document batch...
2025-11-14 16:08:11,829 - INFO - Processing document 10-Q_2024-12-04
2025-11-14 16:08:12,817 - INFO - Finished converting document 10-Q_2024-12-04 in 1.83 sec.
2025-11-14 16:08:13,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-12-04' --> 'data\processed_data\CRM\10-Q_2024-12-04.md'


2025-11-14 16:08:14,003 - INFO - Going to convert document batch...
2025-11-14 16:08:14,004 - INFO - Processing document 10-Q_2025-05-29
2025-11-14 16:08:14,690 - INFO - Finished converting document 10-Q_2025-05-29 in 1.41 sec.
2025-11-14 16:08:15,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2025-05-29' --> 'data\processed_data\CRM\10-Q_2025-05-29.md'


2025-11-14 16:08:16,905 - INFO - Going to convert document batch...
2025-11-14 16:08:16,906 - INFO - Processing document 10-Q_2025-09-04
2025-11-14 16:08:19,765 - INFO - Finished converting document 10-Q_2025-09-04 in 4.06 sec.
2025-11-14 16:08:21,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,282 - INFO - Going to convert document batch...
2025-11-14 16:08:21,286 - INFO - Processing document 4_2023-01-04
2025-11-14 16:08:21,368 - INFO - Finished converting document 4_2023-01-04 in 0.25 sec.


Converted 'data\edgar_documents\CRM\10-Q_2025-09-04' --> 'data\processed_data\CRM\10-Q_2025-09-04.md'


2025-11-14 16:08:21,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,464 - INFO - Going to convert document batch...
2025-11-14 16:08:21,465 - INFO - Processing document 4_2023-01-05
2025-11-14 16:08:21,524 - INFO - Finished converting document 4_2023-01-05 in 0.09 sec.
2025-11-14 16:08:21,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,620 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-04' --> 'data\processed_data\CRM\4_2023-01-04.md'
Converted 'data\edgar_documents\CRM\4_2023-01-05' --> 'data\processed_data\CRM\4_2023-01-05.md'


2025-11-14 16:08:21,621 - INFO - Processing document 4_2023-01-09
2025-11-14 16:08:21,684 - INFO - Finished converting document 4_2023-01-09 in 0.11 sec.
2025-11-14 16:08:21,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,783 - INFO - Going to convert document batch...
2025-11-14 16:08:21,784 - INFO - Processing document 4_2023-01-10
2025-11-14 16:08:21,848 - INFO - Finished converting document 4_2023-01-10 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-01-09' --> 'data\processed_data\CRM\4_2023-01-09.md'
Converted 'data\edgar_documents\CRM\4_2023-01-10' --> 'data\processed_data\CRM\4_2023-01-10.md'


2025-11-14 16:08:21,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,965 - INFO - Going to convert document batch...
2025-11-14 16:08:21,967 - INFO - Processing document 4_2023-01-11
2025-11-14 16:08:22,016 - INFO - Finished converting document 4_2023-01-11 in 0.11 sec.
2025-11-14 16:08:22,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,101 - INFO - Going to convert document batch...
2025-11-14 16:08:22,102 - INFO - Processing document 4_2023-01-12
2025-11-14 16:08:22,153 - INFO - Finished converting document 4_2023-01-12 in 0.09 sec.
2025-11-14 16:08:22,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-11' --> 'data\processed_data\CRM\4_2023-01-11.md'
Converted 'data\edgar_documents\CRM\4_2023-01-12' --> 'data\processed_data\CRM\4_2023-01-12.md'


2025-11-14 16:08:22,276 - INFO - Going to convert document batch...
2025-11-14 16:08:22,278 - INFO - Processing document 4_2023-01-13
2025-11-14 16:08:22,346 - INFO - Finished converting document 4_2023-01-13 in 0.12 sec.
2025-11-14 16:08:22,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,435 - INFO - Going to convert document batch...
2025-11-14 16:08:22,435 - INFO - Processing document 4_2023-01-18
2025-11-14 16:08:22,494 - INFO - Finished converting document 4_2023-01-18 in 0.11 sec.
2025-11-14 16:08:22,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,586 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-13' --> 'data\processed_data\CRM\4_2023-01-13.md'
Converted 'data\edgar_documents\CRM\4_2023-01-18' --> 'data\processed_data\CRM\4_2023-01-18.md'


2025-11-14 16:08:22,588 - INFO - Processing document 4_2023-01-19
2025-11-14 16:08:22,647 - INFO - Finished converting document 4_2023-01-19 in 0.09 sec.
2025-11-14 16:08:22,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,745 - INFO - Going to convert document batch...
2025-11-14 16:08:22,747 - INFO - Processing document 4_2023-01-20
2025-11-14 16:08:22,844 - INFO - Finished converting document 4_2023-01-20 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-01-19' --> 'data\processed_data\CRM\4_2023-01-19.md'


2025-11-14 16:08:22,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,978 - INFO - Going to convert document batch...
2025-11-14 16:08:22,980 - INFO - Processing document 4_2023-01-23
2025-11-14 16:08:23,046 - INFO - Finished converting document 4_2023-01-23 in 0.14 sec.
2025-11-14 16:08:23,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-20' --> 'data\processed_data\CRM\4_2023-01-20.md'
Converted 'data\edgar_documents\CRM\4_2023-01-23' --> 'data\processed_data\CRM\4_2023-01-23.md'


2025-11-14 16:08:23,132 - INFO - Going to convert document batch...
2025-11-14 16:08:23,133 - INFO - Processing document 4_2023-01-24
2025-11-14 16:08:23,203 - INFO - Finished converting document 4_2023-01-24 in 0.12 sec.
2025-11-14 16:08:23,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,346 - INFO - Going to convert document batch...
2025-11-14 16:08:23,346 - INFO - Processing document 4_2023-01-25
2025-11-14 16:08:23,407 - INFO - Finished converting document 4_2023-01-25 in 0.11 sec.
2025-11-14 16:08:23,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-24' --> 'data\processed_data\CRM\4_2023-01-24.md'
Converted 'data\edgar_documents\CRM\4_2023-01-25' --> 'data\processed_data\CRM\4_2023-01-25.md'


2025-11-14 16:08:23,516 - INFO - Going to convert document batch...
2025-11-14 16:08:23,516 - INFO - Processing document 4_2023-01-27
2025-11-14 16:08:23,614 - INFO - Finished converting document 4_2023-01-27 in 0.16 sec.
2025-11-14 16:08:23,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,744 - INFO - Going to convert document batch...
2025-11-14 16:08:23,746 - INFO - Processing document 4_2023-01-30
2025-11-14 16:08:23,804 - INFO - Finished converting document 4_2023-01-30 in 0.11 sec.
2025-11-14 16:08:23,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,892 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-27' --> 'data\processed_data\CRM\4_2023-01-27.md'
Converted 'data\edgar_documents\CRM\4_2023-01-30' --> 'data\processed_data\CRM\4_2023-01-30.md'


2025-11-14 16:08:23,894 - INFO - Processing document 4_2023-01-31
2025-11-14 16:08:23,944 - INFO - Finished converting document 4_2023-01-31 in 0.09 sec.
2025-11-14 16:08:24,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,027 - INFO - Going to convert document batch...
2025-11-14 16:08:24,028 - INFO - Processing document 4_2023-02-01
2025-11-14 16:08:24,086 - INFO - Finished converting document 4_2023-02-01 in 0.09 sec.
2025-11-14 16:08:24,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-31' --> 'data\processed_data\CRM\4_2023-01-31.md'
Converted 'data\edgar_documents\CRM\4_2023-02-01' --> 'data\processed_data\CRM\4_2023-02-01.md'


2025-11-14 16:08:24,195 - INFO - Going to convert document batch...
2025-11-14 16:08:24,197 - INFO - Processing document 4_2023-02-02
2025-11-14 16:08:24,292 - INFO - Finished converting document 4_2023-02-02 in 0.17 sec.
2025-11-14 16:08:24,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,411 - INFO - Going to convert document batch...
2025-11-14 16:08:24,412 - INFO - Processing document 4_2023-02-03
2025-11-14 16:08:24,470 - INFO - Finished converting document 4_2023-02-03 in 0.09 sec.
2025-11-14 16:08:24,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-02' --> 'data\processed_data\CRM\4_2023-02-02.md'
Converted 'data\edgar_documents\CRM\4_2023-02-03' --> 'data\processed_data\CRM\4_2023-02-03.md'


2025-11-14 16:08:24,570 - INFO - Going to convert document batch...
2025-11-14 16:08:24,574 - INFO - Processing document 4_2023-02-06
2025-11-14 16:08:24,629 - INFO - Finished converting document 4_2023-02-06 in 0.11 sec.
2025-11-14 16:08:24,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,726 - INFO - Going to convert document batch...
2025-11-14 16:08:24,727 - INFO - Processing document 4_2023-02-07
2025-11-14 16:08:24,780 - INFO - Finished converting document 4_2023-02-07 in 0.11 sec.
2025-11-14 16:08:24,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-06' --> 'data\processed_data\CRM\4_2023-02-06.md'
Converted 'data\edgar_documents\CRM\4_2023-02-07' --> 'data\processed_data\CRM\4_2023-02-07.md'


2025-11-14 16:08:24,909 - INFO - Going to convert document batch...
2025-11-14 16:08:24,912 - INFO - Processing document 4_2023-02-08
2025-11-14 16:08:24,985 - INFO - Finished converting document 4_2023-02-08 in 0.14 sec.
2025-11-14 16:08:25,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,120 - INFO - Going to convert document batch...
2025-11-14 16:08:25,122 - INFO - Processing document 4_2023-02-09
2025-11-14 16:08:25,169 - INFO - Finished converting document 4_2023-02-09 in 0.09 sec.
2025-11-14 16:08:25,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,262 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-02-08' --> 'data\processed_data\CRM\4_2023-02-08.md'
Converted 'data\edgar_documents\CRM\4_2023-02-09' --> 'data\processed_data\CRM\4_2023-02-09.md'


2025-11-14 16:08:25,263 - INFO - Processing document 4_2023-02-10
2025-11-14 16:08:25,318 - INFO - Finished converting document 4_2023-02-10 in 0.09 sec.
2025-11-14 16:08:25,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,401 - INFO - Going to convert document batch...
2025-11-14 16:08:25,402 - INFO - Processing document 4_2023-02-13
2025-11-14 16:08:25,452 - INFO - Finished converting document 4_2023-02-13 in 0.09 sec.
2025-11-14 16:08:25,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-10' --> 'data\processed_data\CRM\4_2023-02-10.md'
Converted 'data\edgar_documents\CRM\4_2023-02-13' --> 'data\processed_data\CRM\4_2023-02-13.md'


2025-11-14 16:08:25,594 - INFO - Going to convert document batch...
2025-11-14 16:08:25,595 - INFO - Processing document 4_2023-02-14
2025-11-14 16:08:25,685 - INFO - Finished converting document 4_2023-02-14 in 0.16 sec.
2025-11-14 16:08:25,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,768 - INFO - Going to convert document batch...
2025-11-14 16:08:25,769 - INFO - Processing document 4_2023-02-15
2025-11-14 16:08:25,863 - INFO - Finished converting document 4_2023-02-15 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-14' --> 'data\processed_data\CRM\4_2023-02-14.md'


2025-11-14 16:08:25,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,037 - INFO - Going to convert document batch...
2025-11-14 16:08:26,039 - INFO - Processing document 4_2023-02-16
2025-11-14 16:08:26,133 - INFO - Finished converting document 4_2023-02-16 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-15' --> 'data\processed_data\CRM\4_2023-02-15.md'


2025-11-14 16:08:26,198 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,213 - INFO - Going to convert document batch...
2025-11-14 16:08:26,214 - INFO - Processing document 4_2023-02-17
2025-11-14 16:08:26,251 - INFO - Finished converting document 4_2023-02-17 in 0.06 sec.
2025-11-14 16:08:26,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,325 - INFO - Going to convert document batch...
2025-11-14 16:08:26,326 - INFO - Processing document 4_2023-02-21
2025-11-14 16:08:26,381 - INFO - Finished converting document 4_2023-02-21 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-16' --> 'data\processed_data\CRM\4_2023-02-16.md'
Converted 'data\edgar_documents\CRM\4_2023-02-17' --> 'data\processed_data\CRM\4_2023-02-17.md'


2025-11-14 16:08:26,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,501 - INFO - Going to convert document batch...
2025-11-14 16:08:26,502 - INFO - Processing document 4_2023-02-22
2025-11-14 16:08:26,577 - INFO - Finished converting document 4_2023-02-22 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-21' --> 'data\processed_data\CRM\4_2023-02-21.md'
Converted 'data\edgar_documents\CRM\4_2023-02-22' --> 'data\processed_data\CRM\4_2023-02-22.md'


2025-11-14 16:08:26,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,674 - INFO - Going to convert document batch...
2025-11-14 16:08:26,675 - INFO - Processing document 4_2023-02-23
2025-11-14 16:08:26,717 - INFO - Finished converting document 4_2023-02-23 in 0.09 sec.
2025-11-14 16:08:26,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,791 - INFO - Going to convert document batch...
2025-11-14 16:08:26,792 - INFO - Processing document 4_2023-02-24
2025-11-14 16:08:26,843 - INFO - Finished converting document 4_2023-02-24 in 0.09 sec.
2025-11-14 16:08:26,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,932 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-02-23' --> 'data\processed_data\CRM\4_2023-02-23.md'
Converted 'data\edgar_documents\CRM\4_2023-02-24' --> 'data\processed_data\CRM\4_2023-02-24.md'


2025-11-14 16:08:26,933 - INFO - Processing document 4_2023-02-27
2025-11-14 16:08:26,985 - INFO - Finished converting document 4_2023-02-27 in 0.09 sec.
2025-11-14 16:08:27,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,066 - INFO - Going to convert document batch...
2025-11-14 16:08:27,067 - INFO - Processing document 4_2023-02-28
2025-11-14 16:08:27,116 - INFO - Finished converting document 4_2023-02-28 in 0.08 sec.
2025-11-14 16:08:27,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-27' --> 'data\processed_data\CRM\4_2023-02-27.md'
Converted 'data\edgar_documents\CRM\4_2023-02-28' --> 'data\processed_data\CRM\4_2023-02-28.md'


2025-11-14 16:08:27,257 - INFO - Going to convert document batch...
2025-11-14 16:08:27,259 - INFO - Processing document 4_2023-03-01
2025-11-14 16:08:27,424 - INFO - Finished converting document 4_2023-03-01 in 0.25 sec.
2025-11-14 16:08:27,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,556 - INFO - Going to convert document batch...
2025-11-14 16:08:27,557 - INFO - Processing document 4_2023-03-02
2025-11-14 16:08:27,668 - INFO - Finished converting document 4_2023-03-02 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-01' --> 'data\processed_data\CRM\4_2023-03-01.md'


2025-11-14 16:08:27,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,822 - INFO - Going to convert document batch...
2025-11-14 16:08:27,823 - INFO - Processing document 4_2023-03-03
2025-11-14 16:08:27,904 - INFO - Finished converting document 4_2023-03-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-02' --> 'data\processed_data\CRM\4_2023-03-02.md'


2025-11-14 16:08:28,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,070 - INFO - Going to convert document batch...
2025-11-14 16:08:28,072 - INFO - Processing document 4_2023-03-06
2025-11-14 16:08:28,173 - INFO - Finished converting document 4_2023-03-06 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-03' --> 'data\processed_data\CRM\4_2023-03-03.md'


2025-11-14 16:08:28,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,337 - INFO - Going to convert document batch...
2025-11-14 16:08:28,339 - INFO - Processing document 4_2023-03-07
2025-11-14 16:08:28,409 - INFO - Finished converting document 4_2023-03-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-06' --> 'data\processed_data\CRM\4_2023-03-06.md'
Converted 'data\edgar_documents\CRM\4_2023-03-07' --> 'data\processed_data\CRM\4_2023-03-07.md'


2025-11-14 16:08:28,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,523 - INFO - Going to convert document batch...
2025-11-14 16:08:28,524 - INFO - Processing document 4_2023-03-08
2025-11-14 16:08:28,575 - INFO - Finished converting document 4_2023-03-08 in 0.11 sec.
2025-11-14 16:08:28,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,658 - INFO - Going to convert document batch...
2025-11-14 16:08:28,659 - INFO - Processing document 4_2023-03-09
2025-11-14 16:08:28,709 - INFO - Finished converting document 4_2023-03-09 in 0.08 sec.
2025-11-14 16:08:28,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,797 - INFO - Going to convert document batch...
2025-11-14 16:08:28,798 - INFO - Processing document 4_2023-03-10
2025-11-14 16:08:28,831 - INFO - Finished converting document 4_2023-03-10 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-08' --> 'data\processed_data\CRM\4_2023-03-08.md'
Converted 'data\edgar_documents\CRM\4_2023-03-09' --> 'data\processed_data\CRM\4_2023-03-09.md'


2025-11-14 16:08:28,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,908 - INFO - Going to convert document batch...
2025-11-14 16:08:28,910 - INFO - Processing document 4_2023-03-13


Converted 'data\edgar_documents\CRM\4_2023-03-10' --> 'data\processed_data\CRM\4_2023-03-10.md'


2025-11-14 16:08:30,002 - INFO - Finished converting document 4_2023-03-13 in 1.14 sec.
2025-11-14 16:08:30,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,204 - INFO - Going to convert document batch...
2025-11-14 16:08:30,207 - INFO - Processing document 4_2023-03-14
2025-11-14 16:08:30,282 - INFO - Finished converting document 4_2023-03-14 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-13' --> 'data\processed_data\CRM\4_2023-03-13.md'


2025-11-14 16:08:30,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,439 - INFO - Going to convert document batch...
2025-11-14 16:08:30,441 - INFO - Processing document 4_2023-03-15
2025-11-14 16:08:30,539 - INFO - Finished converting document 4_2023-03-15 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-14' --> 'data\processed_data\CRM\4_2023-03-14.md'


2025-11-14 16:08:30,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,685 - INFO - Going to convert document batch...
2025-11-14 16:08:30,689 - INFO - Processing document 4_2023-03-16


Converted 'data\edgar_documents\CRM\4_2023-03-15' --> 'data\processed_data\CRM\4_2023-03-15.md'


2025-11-14 16:08:30,853 - INFO - Finished converting document 4_2023-03-16 in 0.22 sec.
2025-11-14 16:08:30,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,974 - INFO - Going to convert document batch...
2025-11-14 16:08:30,976 - INFO - Processing document 4_2023-03-17
2025-11-14 16:08:31,031 - INFO - Finished converting document 4_2023-03-17 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-16' --> 'data\processed_data\CRM\4_2023-03-16.md'
Converted 'data\edgar_documents\CRM\4_2023-03-17' --> 'data\processed_data\CRM\4_2023-03-17.md'


2025-11-14 16:08:31,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,170 - INFO - Going to convert document batch...
2025-11-14 16:08:31,172 - INFO - Processing document 4_2023-03-20
2025-11-14 16:08:31,223 - INFO - Finished converting document 4_2023-03-20 in 0.11 sec.
2025-11-14 16:08:31,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,365 - INFO - Going to convert document batch...
2025-11-14 16:08:31,366 - INFO - Processing document 4_2023-03-21
2025-11-14 16:08:31,430 - INFO - Finished converting document 4_2023-03-21 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-20' --> 'data\processed_data\CRM\4_2023-03-20.md'
Converted 'data\edgar_documents\CRM\4_2023-03-21' --> 'data\processed_data\CRM\4_2023-03-21.md'


2025-11-14 16:08:31,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,573 - INFO - Going to convert document batch...
2025-11-14 16:08:31,575 - INFO - Processing document 4_2023-03-22
2025-11-14 16:08:31,650 - INFO - Finished converting document 4_2023-03-22 in 0.14 sec.
2025-11-14 16:08:31,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,808 - INFO - Going to convert document batch...
2025-11-14 16:08:31,809 - INFO - Processing document 4_2023-03-23
2025-11-14 16:08:31,916 - INFO - Finished converting document 4_2023-03-23 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-22' --> 'data\processed_data\CRM\4_2023-03-22.md'


2025-11-14 16:08:32,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,019 - INFO - Going to convert document batch...
2025-11-14 16:08:32,022 - INFO - Processing document 4_2023-03-24
2025-11-14 16:08:32,073 - INFO - Finished converting document 4_2023-03-24 in 0.09 sec.
2025-11-14 16:08:32,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,188 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-03-23' --> 'data\processed_data\CRM\4_2023-03-23.md'
Converted 'data\edgar_documents\CRM\4_2023-03-24' --> 'data\processed_data\CRM\4_2023-03-24.md'


2025-11-14 16:08:32,189 - INFO - Processing document 4_2023-03-27
2025-11-14 16:08:32,256 - INFO - Finished converting document 4_2023-03-27 in 0.11 sec.
2025-11-14 16:08:32,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,350 - INFO - Going to convert document batch...
2025-11-14 16:08:32,351 - INFO - Processing document 4_2023-03-28
2025-11-14 16:08:32,430 - INFO - Finished converting document 4_2023-03-28 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-27' --> 'data\processed_data\CRM\4_2023-03-27.md'


2025-11-14 16:08:32,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,605 - INFO - Going to convert document batch...
2025-11-14 16:08:32,608 - INFO - Processing document 4_2023-03-29
2025-11-14 16:08:32,679 - INFO - Finished converting document 4_2023-03-29 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-28' --> 'data\processed_data\CRM\4_2023-03-28.md'


2025-11-14 16:08:32,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,859 - INFO - Going to convert document batch...
2025-11-14 16:08:32,861 - INFO - Processing document 4_2023-03-30
2025-11-14 16:08:32,985 - INFO - Finished converting document 4_2023-03-30 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-29' --> 'data\processed_data\CRM\4_2023-03-29.md'


2025-11-14 16:08:33,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,109 - INFO - Going to convert document batch...
2025-11-14 16:08:33,110 - INFO - Processing document 4_2023-04-03
2025-11-14 16:08:33,231 - INFO - Finished converting document 4_2023-04-03 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-30' --> 'data\processed_data\CRM\4_2023-03-30.md'


2025-11-14 16:08:33,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,443 - INFO - Going to convert document batch...
2025-11-14 16:08:33,445 - INFO - Processing document 4_2023-04-05
2025-11-14 16:08:33,547 - INFO - Finished converting document 4_2023-04-05 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-04-03' --> 'data\processed_data\CRM\4_2023-04-03.md'


2025-11-14 16:08:33,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,712 - INFO - Going to convert document batch...
2025-11-14 16:08:33,713 - INFO - Processing document 4_2023-04-11
2025-11-14 16:08:33,764 - INFO - Finished converting document 4_2023-04-11 in 0.09 sec.
2025-11-14 16:08:33,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-04-05' --> 'data\processed_data\CRM\4_2023-04-05.md'
Converted 'data\edgar_documents\CRM\4_2023-04-11' --> 'data\processed_data\CRM\4_2023-04-11.md'


2025-11-14 16:08:33,865 - INFO - Processing document 4_2023-04-12
2025-11-14 16:08:33,928 - INFO - Finished converting document 4_2023-04-12 in 0.11 sec.
2025-11-14 16:08:34,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,031 - INFO - Going to convert document batch...
2025-11-14 16:08:34,033 - INFO - Processing document 4_2023-04-19
2025-11-14 16:08:34,097 - INFO - Finished converting document 4_2023-04-19 in 0.11 sec.
2025-11-14 16:08:34,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-04-12' --> 'data\processed_data\CRM\4_2023-04-12.md'
Converted 'data\edgar_documents\CRM\4_2023-04-19' --> 'data\processed_data\CRM\4_2023-04-19.md'


2025-11-14 16:08:34,214 - INFO - Going to convert document batch...
2025-11-14 16:08:34,215 - INFO - Processing document 4_2023-04-24
2025-11-14 16:08:34,280 - INFO - Finished converting document 4_2023-04-24 in 0.12 sec.
2025-11-14 16:08:34,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,409 - INFO - Going to convert document batch...
2025-11-14 16:08:34,410 - INFO - Processing document 4_2023-04-26
2025-11-14 16:08:34,464 - INFO - Finished converting document 4_2023-04-26 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-04-24' --> 'data\processed_data\CRM\4_2023-04-24.md'
Converted 'data\edgar_documents\CRM\4_2023-04-26' --> 'data\processed_data\CRM\4_2023-04-26.md'


2025-11-14 16:08:34,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,621 - INFO - Going to convert document batch...
2025-11-14 16:08:34,622 - INFO - Processing document 4_2023-05-03
2025-11-14 16:08:34,709 - INFO - Finished converting document 4_2023-05-03 in 0.17 sec.
2025-11-14 16:08:34,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,824 - INFO - Going to convert document batch...
2025-11-14 16:08:34,825 - INFO - Processing document 4_2023-05-10
2025-11-14 16:08:34,916 - INFO - Finished converting document 4_2023-05-10 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-05-03' --> 'data\processed_data\CRM\4_2023-05-03.md'


2025-11-14 16:08:35,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,060 - INFO - Going to convert document batch...
2025-11-14 16:08:35,062 - INFO - Processing document 4_2023-05-17
2025-11-14 16:08:35,144 - INFO - Finished converting document 4_2023-05-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-05-10' --> 'data\processed_data\CRM\4_2023-05-10.md'
Converted 'data\edgar_documents\CRM\4_2023-05-17' --> 'data\processed_data\CRM\4_2023-05-17.md'


2025-11-14 16:08:35,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,283 - INFO - Going to convert document batch...
2025-11-14 16:08:35,284 - INFO - Processing document 4_2023-05-23
2025-11-14 16:08:35,416 - INFO - Finished converting document 4_2023-05-23 in 0.20 sec.
2025-11-14 16:08:35,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,557 - INFO - Going to convert document batch...
2025-11-14 16:08:35,558 - INFO - Processing document 4_2023-05-24
2025-11-14 16:08:35,615 - INFO - Finished converting document 4_2023-05-24 in 0.09 sec.
2025-11-14 16:08:35,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-05-23' --> 'data\processed_data\CRM\4_2023-05-23.md'
Converted 'data\edgar_documents\CRM\4_2023-05-24' --> 'data\processed_data\CRM\4_2023-05-24.md'


2025-11-14 16:08:35,748 - INFO - Going to convert document batch...
2025-11-14 16:08:35,752 - INFO - Processing document 4_2023-05-31
2025-11-14 16:08:35,818 - INFO - Finished converting document 4_2023-05-31 in 0.14 sec.
2025-11-14 16:08:35,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,938 - INFO - Going to convert document batch...
2025-11-14 16:08:35,940 - INFO - Processing document 4_2023-06-01
2025-11-14 16:08:35,996 - INFO - Finished converting document 4_2023-06-01 in 0.11 sec.
2025-11-14 16:08:36,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-05-31' --> 'data\processed_data\CRM\4_2023-05-31.md'
Converted 'data\edgar_documents\CRM\4_2023-06-01' --> 'data\processed_data\CRM\4_2023-06-01.md'


2025-11-14 16:08:36,117 - INFO - Going to convert document batch...
2025-11-14 16:08:36,117 - INFO - Processing document 4_2023-06-06
2025-11-14 16:08:36,173 - INFO - Finished converting document 4_2023-06-06 in 0.12 sec.
2025-11-14 16:08:36,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,293 - INFO - Going to convert document batch...
2025-11-14 16:08:36,296 - INFO - Processing document 4_2023-06-07
2025-11-14 16:08:36,379 - INFO - Finished converting document 4_2023-06-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-06' --> 'data\processed_data\CRM\4_2023-06-06.md'


2025-11-14 16:08:36,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,536 - INFO - Going to convert document batch...
2025-11-14 16:08:36,537 - INFO - Processing document 4_2023-06-09
2025-11-14 16:08:36,589 - INFO - Finished converting document 4_2023-06-09 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-07' --> 'data\processed_data\CRM\4_2023-06-07.md'
Converted 'data\edgar_documents\CRM\4_2023-06-09' --> 'data\processed_data\CRM\4_2023-06-09.md'


2025-11-14 16:08:36,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,769 - INFO - Going to convert document batch...
2025-11-14 16:08:36,771 - INFO - Processing document 4_2023-06-14
2025-11-14 16:08:36,928 - INFO - Finished converting document 4_2023-06-14 in 0.25 sec.
2025-11-14 16:08:37,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,044 - INFO - Going to convert document batch...
2025-11-14 16:08:37,046 - INFO - Processing document 4_2023-06-16
2025-11-14 16:08:37,122 - INFO - Finished converting document 4_2023-06-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-14' --> 'data\processed_data\CRM\4_2023-06-14.md'


2025-11-14 16:08:37,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,300 - INFO - Going to convert document batch...
2025-11-14 16:08:37,302 - INFO - Processing document 4_2023-06-20
2025-11-14 16:08:37,376 - INFO - Finished converting document 4_2023-06-20 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-16' --> 'data\processed_data\CRM\4_2023-06-16.md'


2025-11-14 16:08:37,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,509 - INFO - Going to convert document batch...
2025-11-14 16:08:37,510 - INFO - Processing document 4_2023-06-21


Converted 'data\edgar_documents\CRM\4_2023-06-20' --> 'data\processed_data\CRM\4_2023-06-20.md'


2025-11-14 16:08:38,057 - INFO - Finished converting document 4_2023-06-21 in 0.62 sec.
2025-11-14 16:08:38,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,262 - INFO - Going to convert document batch...
2025-11-14 16:08:38,264 - INFO - Processing document 4_2023-06-23
2025-11-14 16:08:38,336 - INFO - Finished converting document 4_2023-06-23 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-21' --> 'data\processed_data\CRM\4_2023-06-21.md'


2025-11-14 16:08:38,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,427 - INFO - Going to convert document batch...
2025-11-14 16:08:38,429 - INFO - Processing document 4_2023-06-27
2025-11-14 16:08:38,472 - INFO - Finished converting document 4_2023-06-27 in 0.08 sec.
2025-11-14 16:08:38,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,578 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-06-23' --> 'data\processed_data\CRM\4_2023-06-23.md'
Converted 'data\edgar_documents\CRM\4_2023-06-27' --> 'data\processed_data\CRM\4_2023-06-27.md'


2025-11-14 16:08:38,579 - INFO - Processing document 4_2023-06-28
2025-11-14 16:08:38,644 - INFO - Finished converting document 4_2023-06-28 in 0.12 sec.
2025-11-14 16:08:38,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,764 - INFO - Going to convert document batch...
2025-11-14 16:08:38,766 - INFO - Processing document 4_2023-06-30
2025-11-14 16:08:38,809 - INFO - Finished converting document 4_2023-06-30 in 0.08 sec.
2025-11-14 16:08:38,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,956 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-06-28' --> 'data\processed_data\CRM\4_2023-06-28.md'
Converted 'data\edgar_documents\CRM\4_2023-06-30' --> 'data\processed_data\CRM\4_2023-06-30.md'


2025-11-14 16:08:38,957 - INFO - Processing document 4_2023-07-03
2025-11-14 16:08:39,036 - INFO - Finished converting document 4_2023-07-03 in 0.16 sec.
2025-11-14 16:08:39,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,166 - INFO - Going to convert document batch...
2025-11-14 16:08:39,167 - INFO - Processing document 4_2023-07-05
2025-11-14 16:08:39,216 - INFO - Finished converting document 4_2023-07-05 in 0.09 sec.
2025-11-14 16:08:39,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-03' --> 'data\processed_data\CRM\4_2023-07-03.md'
Converted 'data\edgar_documents\CRM\4_2023-07-05' --> 'data\processed_data\CRM\4_2023-07-05.md'


2025-11-14 16:08:39,343 - INFO - Going to convert document batch...
2025-11-14 16:08:39,346 - INFO - Processing document 4_2023-07-06
2025-11-14 16:08:39,423 - INFO - Finished converting document 4_2023-07-06 in 0.16 sec.
2025-11-14 16:08:39,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,543 - INFO - Going to convert document batch...
2025-11-14 16:08:39,544 - INFO - Processing document 4_2023-07-07
2025-11-14 16:08:39,608 - INFO - Finished converting document 4_2023-07-07 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-06' --> 'data\processed_data\CRM\4_2023-07-06.md'
Converted 'data\edgar_documents\CRM\4_2023-07-07' --> 'data\processed_data\CRM\4_2023-07-07.md'


2025-11-14 16:08:39,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,740 - INFO - Going to convert document batch...
2025-11-14 16:08:39,742 - INFO - Processing document 4_2023-07-10
2025-11-14 16:08:39,847 - INFO - Finished converting document 4_2023-07-10 in 0.17 sec.
2025-11-14 16:08:39,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,021 - INFO - Going to convert document batch...
2025-11-14 16:08:40,024 - INFO - Processing document 4_2023-07-11
2025-11-14 16:08:40,118 - INFO - Finished converting document 4_2023-07-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-10' --> 'data\processed_data\CRM\4_2023-07-10.md'


2025-11-14 16:08:40,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,227 - INFO - Going to convert document batch...
2025-11-14 16:08:40,228 - INFO - Processing document 4_2023-07-12
2025-11-14 16:08:40,278 - INFO - Finished converting document 4_2023-07-12 in 0.11 sec.
2025-11-14 16:08:40,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-11' --> 'data\processed_data\CRM\4_2023-07-11.md'
Converted 'data\edgar_documents\CRM\4_2023-07-12' --> 'data\processed_data\CRM\4_2023-07-12.md'


2025-11-14 16:08:40,394 - INFO - Going to convert document batch...
2025-11-14 16:08:40,396 - INFO - Processing document 4_2023-07-13
2025-11-14 16:08:40,477 - INFO - Finished converting document 4_2023-07-13 in 0.14 sec.
2025-11-14 16:08:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,647 - INFO - Going to convert document batch...
2025-11-14 16:08:40,649 - INFO - Processing document 4_2023-07-14
2025-11-14 16:08:40,742 - INFO - Finished converting document 4_2023-07-14 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-13' --> 'data\processed_data\CRM\4_2023-07-13.md'


2025-11-14 16:08:40,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,910 - INFO - Going to convert document batch...
2025-11-14 16:08:40,911 - INFO - Processing document 4_2023-07-17
2025-11-14 16:08:40,965 - INFO - Finished converting document 4_2023-07-17 in 0.12 sec.
2025-11-14 16:08:41,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-14' --> 'data\processed_data\CRM\4_2023-07-14.md'
Converted 'data\edgar_documents\CRM\4_2023-07-17' --> 'data\processed_data\CRM\4_2023-07-17.md'


2025-11-14 16:08:41,108 - INFO - Going to convert document batch...
2025-11-14 16:08:41,109 - INFO - Processing document 4_2023-07-18
2025-11-14 16:08:41,156 - INFO - Finished converting document 4_2023-07-18 in 0.14 sec.
2025-11-14 16:08:41,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,242 - INFO - Going to convert document batch...
2025-11-14 16:08:41,244 - INFO - Processing document 4_2023-07-19
2025-11-14 16:08:41,299 - INFO - Finished converting document 4_2023-07-19 in 0.09 sec.
2025-11-14 16:08:41,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,384 - INFO - Going to convert document batch...
2025-11-14 16:08:41,385 - INFO - Processing document 4_2023-07-20


Converted 'data\edgar_documents\CRM\4_2023-07-18' --> 'data\processed_data\CRM\4_2023-07-18.md'
Converted 'data\edgar_documents\CRM\4_2023-07-19' --> 'data\processed_data\CRM\4_2023-07-19.md'


2025-11-14 16:08:41,443 - INFO - Finished converting document 4_2023-07-20 in 0.09 sec.
2025-11-14 16:08:41,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,553 - INFO - Going to convert document batch...
2025-11-14 16:08:41,554 - INFO - Processing document 4_2023-07-21
2025-11-14 16:08:41,608 - INFO - Finished converting document 4_2023-07-21 in 0.11 sec.
2025-11-14 16:08:41,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-20' --> 'data\processed_data\CRM\4_2023-07-20.md'
Converted 'data\edgar_documents\CRM\4_2023-07-21' --> 'data\processed_data\CRM\4_2023-07-21.md'


2025-11-14 16:08:41,729 - INFO - Going to convert document batch...
2025-11-14 16:08:41,732 - INFO - Processing document 4_2023-07-24
2025-11-14 16:08:41,788 - INFO - Finished converting document 4_2023-07-24 in 0.12 sec.
2025-11-14 16:08:41,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,866 - INFO - Going to convert document batch...
2025-11-14 16:08:41,867 - INFO - Processing document 4_2023-07-25
2025-11-14 16:08:41,910 - INFO - Finished converting document 4_2023-07-25 in 0.08 sec.
2025-11-14 16:08:41,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,993 - INFO - Going to convert document batch...
2025-11-14 16:08:41,994 - INFO - Processing document 4_2023-07-26


Converted 'data\edgar_documents\CRM\4_2023-07-24' --> 'data\processed_data\CRM\4_2023-07-24.md'
Converted 'data\edgar_documents\CRM\4_2023-07-25' --> 'data\processed_data\CRM\4_2023-07-25.md'


2025-11-14 16:08:42,040 - INFO - Finished converting document 4_2023-07-26 in 0.06 sec.
2025-11-14 16:08:42,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,136 - INFO - Going to convert document batch...
2025-11-14 16:08:42,139 - INFO - Processing document 4_2023-07-27
2025-11-14 16:08:42,229 - INFO - Finished converting document 4_2023-07-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-26' --> 'data\processed_data\CRM\4_2023-07-26.md'


2025-11-14 16:08:42,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,395 - INFO - Going to convert document batch...
2025-11-14 16:08:42,396 - INFO - Processing document 4_2023-07-28
2025-11-14 16:08:42,475 - INFO - Finished converting document 4_2023-07-28 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-27' --> 'data\processed_data\CRM\4_2023-07-27.md'


2025-11-14 16:08:42,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,565 - INFO - Going to convert document batch...
2025-11-14 16:08:42,565 - INFO - Processing document 4_2023-07-31
2025-11-14 16:08:42,619 - INFO - Finished converting document 4_2023-07-31 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-28' --> 'data\processed_data\CRM\4_2023-07-28.md'
Converted 'data\edgar_documents\CRM\4_2023-07-31' --> 'data\processed_data\CRM\4_2023-07-31.md'


2025-11-14 16:08:42,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,724 - INFO - Going to convert document batch...
2025-11-14 16:08:42,726 - INFO - Processing document 4_2023-08-01
2025-11-14 16:08:42,801 - INFO - Finished converting document 4_2023-08-01 in 0.12 sec.
2025-11-14 16:08:42,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,906 - INFO - Going to convert document batch...
2025-11-14 16:08:42,908 - INFO - Processing document 4_2023-08-02
2025-11-14 16:08:42,960 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-01' --> 'data\processed_data\CRM\4_2023-08-01.md'
Converted 'data\edgar_documents\CRM\4_2023-08-02' --> 'data\processed_data\CRM\4_2023-08-02.md'


2025-11-14 16:08:43,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,094 - INFO - Going to convert document batch...
2025-11-14 16:08:43,096 - INFO - Processing document 4_2023-08-03
2025-11-14 16:08:43,160 - INFO - Finished converting document 4_2023-08-03 in 0.14 sec.
2025-11-14 16:08:43,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,259 - INFO - Going to convert document batch...
2025-11-14 16:08:43,260 - INFO - Processing document 4_2023-08-04
2025-11-14 16:08:43,327 - INFO - Finished converting document 4_2023-08-04 in 0.12 sec.
2025-11-14 16:08:43,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-03' --> 'data\processed_data\CRM\4_2023-08-03.md'
Converted 'data\edgar_documents\CRM\4_2023-08-04' --> 'data\processed_data\CRM\4_2023-08-04.md'


2025-11-14 16:08:43,426 - INFO - Going to convert document batch...
2025-11-14 16:08:43,427 - INFO - Processing document 4_2023-08-07
2025-11-14 16:08:43,479 - INFO - Finished converting document 4_2023-08-07 in 0.09 sec.
2025-11-14 16:08:43,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,574 - INFO - Going to convert document batch...
2025-11-14 16:08:43,576 - INFO - Processing document 4_2023-08-08
2025-11-14 16:08:43,671 - INFO - Finished converting document 4_2023-08-08 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-07' --> 'data\processed_data\CRM\4_2023-08-07.md'


2025-11-14 16:08:43,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,778 - INFO - Going to convert document batch...
2025-11-14 16:08:43,779 - INFO - Processing document 4_2023-08-09
2025-11-14 16:08:43,843 - INFO - Finished converting document 4_2023-08-09 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-08' --> 'data\processed_data\CRM\4_2023-08-08.md'
Converted 'data\edgar_documents\CRM\4_2023-08-09' --> 'data\processed_data\CRM\4_2023-08-09.md'


2025-11-14 16:08:43,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,953 - INFO - Going to convert document batch...
2025-11-14 16:08:43,954 - INFO - Processing document 4_2023-08-10
2025-11-14 16:08:44,010 - INFO - Finished converting document 4_2023-08-10 in 0.11 sec.
2025-11-14 16:08:44,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,124 - INFO - Going to convert document batch...
2025-11-14 16:08:44,126 - INFO - Processing document 4_2023-08-11
2025-11-14 16:08:44,178 - INFO - Finished converting document 4_2023-08-11 in 0.09 sec.
2025-11-14 16:08:44,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-10' --> 'data\processed_data\CRM\4_2023-08-10.md'
Converted 'data\edgar_documents\CRM\4_2023-08-11' --> 'data\processed_data\CRM\4_2023-08-11.md'


2025-11-14 16:08:44,307 - INFO - Going to convert document batch...
2025-11-14 16:08:44,308 - INFO - Processing document 4_2023-08-14
2025-11-14 16:08:44,357 - INFO - Finished converting document 4_2023-08-14 in 0.11 sec.
2025-11-14 16:08:44,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,440 - INFO - Going to convert document batch...
2025-11-14 16:08:44,441 - INFO - Processing document 4_2023-08-15
2025-11-14 16:08:44,492 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 16:08:44,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,612 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-08-14' --> 'data\processed_data\CRM\4_2023-08-14.md'
Converted 'data\edgar_documents\CRM\4_2023-08-15' --> 'data\processed_data\CRM\4_2023-08-15.md'


2025-11-14 16:08:44,614 - INFO - Processing document 4_2023-08-16
2025-11-14 16:08:44,696 - INFO - Finished converting document 4_2023-08-16 in 0.14 sec.
2025-11-14 16:08:44,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,788 - INFO - Going to convert document batch...
2025-11-14 16:08:44,789 - INFO - Processing document 4_2023-08-17
2025-11-14 16:08:44,845 - INFO - Finished converting document 4_2023-08-17 in 0.09 sec.
2025-11-14 16:08:44,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-16' --> 'data\processed_data\CRM\4_2023-08-16.md'
Converted 'data\edgar_documents\CRM\4_2023-08-17' --> 'data\processed_data\CRM\4_2023-08-17.md'


2025-11-14 16:08:45,695 - INFO - Going to convert document batch...
2025-11-14 16:08:45,700 - INFO - Processing document 4_2023-08-18
2025-11-14 16:08:45,777 - INFO - Finished converting document 4_2023-08-18 in 0.88 sec.
2025-11-14 16:08:45,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:45,883 - INFO - Going to convert document batch...
2025-11-14 16:08:45,887 - INFO - Processing document 4_2023-08-21
2025-11-14 16:08:45,945 - INFO - Finished converting document 4_2023-08-21 in 0.11 sec.
2025-11-14 16:08:46,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-18' --> 'data\processed_data\CRM\4_2023-08-18.md'
Converted 'data\edgar_documents\CRM\4_2023-08-21' --> 'data\processed_data\CRM\4_2023-08-21.md'


2025-11-14 16:08:46,068 - INFO - Going to convert document batch...
2025-11-14 16:08:46,070 - INFO - Processing document 4_2023-08-22
2025-11-14 16:08:46,158 - INFO - Finished converting document 4_2023-08-22 in 0.16 sec.
2025-11-14 16:08:46,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,238 - INFO - Going to convert document batch...
2025-11-14 16:08:46,240 - INFO - Processing document 4_2023-08-23
2025-11-14 16:08:46,275 - INFO - Finished converting document 4_2023-08-23 in 0.06 sec.
2025-11-14 16:08:46,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,372 - INFO - Going to convert document batch...
2025-11-14 16:08:46,374 - INFO - Processing document 4_2023-08-24


Converted 'data\edgar_documents\CRM\4_2023-08-22' --> 'data\processed_data\CRM\4_2023-08-22.md'
Converted 'data\edgar_documents\CRM\4_2023-08-23' --> 'data\processed_data\CRM\4_2023-08-23.md'


2025-11-14 16:08:46,440 - INFO - Finished converting document 4_2023-08-24 in 0.11 sec.
2025-11-14 16:08:46,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,529 - INFO - Going to convert document batch...
2025-11-14 16:08:46,531 - INFO - Processing document 4_2023-08-25
2025-11-14 16:08:46,589 - INFO - Finished converting document 4_2023-08-25 in 0.11 sec.
2025-11-14 16:08:46,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-24' --> 'data\processed_data\CRM\4_2023-08-24.md'
Converted 'data\edgar_documents\CRM\4_2023-08-25' --> 'data\processed_data\CRM\4_2023-08-25.md'


2025-11-14 16:08:46,725 - INFO - Going to convert document batch...
2025-11-14 16:08:46,726 - INFO - Processing document 4_2023-08-28
2025-11-14 16:08:46,788 - INFO - Finished converting document 4_2023-08-28 in 0.14 sec.
2025-11-14 16:08:46,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,888 - INFO - Going to convert document batch...
2025-11-14 16:08:46,889 - INFO - Processing document 4_2023-08-29
2025-11-14 16:08:46,940 - INFO - Finished converting document 4_2023-08-29 in 0.09 sec.
2025-11-14 16:08:47,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,036 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-08-28' --> 'data\processed_data\CRM\4_2023-08-28.md'
Converted 'data\edgar_documents\CRM\4_2023-08-29' --> 'data\processed_data\CRM\4_2023-08-29.md'


2025-11-14 16:08:47,037 - INFO - Processing document 4_2023-08-30
2025-11-14 16:08:47,107 - INFO - Finished converting document 4_2023-08-30 in 0.12 sec.
2025-11-14 16:08:47,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,211 - INFO - Going to convert document batch...
2025-11-14 16:08:47,214 - INFO - Processing document 4_2023-08-31
2025-11-14 16:08:47,296 - INFO - Finished converting document 4_2023-08-31 in 0.14 sec.
2025-11-14 16:08:47,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-30' --> 'data\processed_data\CRM\4_2023-08-30.md'
Converted 'data\edgar_documents\CRM\4_2023-08-31' --> 'data\processed_data\CRM\4_2023-08-31.md'


2025-11-14 16:08:47,409 - INFO - Going to convert document batch...
2025-11-14 16:08:47,412 - INFO - Processing document 4_2023-09-01
2025-11-14 16:08:47,502 - INFO - Finished converting document 4_2023-09-01 in 0.16 sec.
2025-11-14 16:08:47,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,622 - INFO - Going to convert document batch...
2025-11-14 16:08:47,624 - INFO - Processing document 4_2023-09-05
2025-11-14 16:08:47,716 - INFO - Finished converting document 4_2023-09-05 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-01' --> 'data\processed_data\CRM\4_2023-09-01.md'


2025-11-14 16:08:47,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,806 - INFO - Going to convert document batch...
2025-11-14 16:08:47,807 - INFO - Processing document 4_2023-09-06
2025-11-14 16:08:47,868 - INFO - Finished converting document 4_2023-09-06 in 0.09 sec.
2025-11-14 16:08:47,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-05' --> 'data\processed_data\CRM\4_2023-09-05.md'
Converted 'data\edgar_documents\CRM\4_2023-09-06' --> 'data\processed_data\CRM\4_2023-09-06.md'


2025-11-14 16:08:47,976 - INFO - Going to convert document batch...
2025-11-14 16:08:47,978 - INFO - Processing document 4_2023-09-07
2025-11-14 16:08:48,055 - INFO - Finished converting document 4_2023-09-07 in 0.14 sec.
2025-11-14 16:08:48,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,142 - INFO - Going to convert document batch...
2025-11-14 16:08:48,142 - INFO - Processing document 4_2023-09-08
2025-11-14 16:08:48,189 - INFO - Finished converting document 4_2023-09-08 in 0.08 sec.
2025-11-14 16:08:48,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,286 - INFO - Going to convert document batch...
2025-11-14 16:08:48,287 - INFO - Processing document 4_2023-09-11


Converted 'data\edgar_documents\CRM\4_2023-09-07' --> 'data\processed_data\CRM\4_2023-09-07.md'
Converted 'data\edgar_documents\CRM\4_2023-09-08' --> 'data\processed_data\CRM\4_2023-09-08.md'


2025-11-14 16:08:48,351 - INFO - Finished converting document 4_2023-09-11 in 0.11 sec.
2025-11-14 16:08:48,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,438 - INFO - Going to convert document batch...
2025-11-14 16:08:48,439 - INFO - Processing document 4_2023-09-12
2025-11-14 16:08:48,483 - INFO - Finished converting document 4_2023-09-12 in 0.08 sec.
2025-11-14 16:08:48,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,593 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-11' --> 'data\processed_data\CRM\4_2023-09-11.md'
Converted 'data\edgar_documents\CRM\4_2023-09-12' --> 'data\processed_data\CRM\4_2023-09-12.md'


2025-11-14 16:08:48,595 - INFO - Processing document 4_2023-09-13
2025-11-14 16:08:48,675 - INFO - Finished converting document 4_2023-09-13 in 0.16 sec.
2025-11-14 16:08:48,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,761 - INFO - Going to convert document batch...
2025-11-14 16:08:48,763 - INFO - Processing document 4_2023-09-14
2025-11-14 16:08:48,814 - INFO - Finished converting document 4_2023-09-14 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-13' --> 'data\processed_data\CRM\4_2023-09-13.md'
Converted 'data\edgar_documents\CRM\4_2023-09-14' --> 'data\processed_data\CRM\4_2023-09-14.md'


2025-11-14 16:08:48,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,939 - INFO - Going to convert document batch...
2025-11-14 16:08:48,941 - INFO - Processing document 4_2023-09-15
2025-11-14 16:08:49,006 - INFO - Finished converting document 4_2023-09-15 in 0.12 sec.
2025-11-14 16:08:49,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,186 - INFO - Going to convert document batch...
2025-11-14 16:08:49,189 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\CRM\4_2023-09-15' --> 'data\processed_data\CRM\4_2023-09-15.md'


2025-11-14 16:08:49,303 - INFO - Finished converting document 4_2023-09-18 in 0.23 sec.
2025-11-14 16:08:49,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,386 - INFO - Going to convert document batch...
2025-11-14 16:08:49,388 - INFO - Processing document 4_2023-09-19
2025-11-14 16:08:49,440 - INFO - Finished converting document 4_2023-09-19 in 0.09 sec.
2025-11-14 16:08:49,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-18' --> 'data\processed_data\CRM\4_2023-09-18.md'
Converted 'data\edgar_documents\CRM\4_2023-09-19' --> 'data\processed_data\CRM\4_2023-09-19.md'


2025-11-14 16:08:49,584 - INFO - Going to convert document batch...
2025-11-14 16:08:49,585 - INFO - Processing document 4_2023-09-20
2025-11-14 16:08:49,658 - INFO - Finished converting document 4_2023-09-20 in 0.14 sec.
2025-11-14 16:08:49,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,776 - INFO - Going to convert document batch...
2025-11-14 16:08:49,782 - INFO - Processing document 4_2023-09-21
2025-11-14 16:08:49,869 - INFO - Finished converting document 4_2023-09-21 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-20' --> 'data\processed_data\CRM\4_2023-09-20.md'


2025-11-14 16:08:49,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,985 - INFO - Going to convert document batch...
2025-11-14 16:08:49,986 - INFO - Processing document 4_2023-09-22
2025-11-14 16:08:50,038 - INFO - Finished converting document 4_2023-09-22 in 0.09 sec.
2025-11-14 16:08:50,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,150 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-21' --> 'data\processed_data\CRM\4_2023-09-21.md'
Converted 'data\edgar_documents\CRM\4_2023-09-22' --> 'data\processed_data\CRM\4_2023-09-22.md'


2025-11-14 16:08:50,151 - INFO - Processing document 4_2023-09-25
2025-11-14 16:08:50,230 - INFO - Finished converting document 4_2023-09-25 in 0.16 sec.
2025-11-14 16:08:50,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,333 - INFO - Going to convert document batch...
2025-11-14 16:08:50,334 - INFO - Processing document 4_2023-09-26
2025-11-14 16:08:50,391 - INFO - Finished converting document 4_2023-09-26 in 0.11 sec.
2025-11-14 16:08:50,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-25' --> 'data\processed_data\CRM\4_2023-09-25.md'
Converted 'data\edgar_documents\CRM\4_2023-09-26' --> 'data\processed_data\CRM\4_2023-09-26.md'


2025-11-14 16:08:50,502 - INFO - Going to convert document batch...
2025-11-14 16:08:50,503 - INFO - Processing document 4_2023-09-27
2025-11-14 16:08:50,556 - INFO - Finished converting document 4_2023-09-27 in 0.09 sec.
2025-11-14 16:08:50,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,667 - INFO - Going to convert document batch...
2025-11-14 16:08:50,669 - INFO - Processing document 4_2023-09-28
2025-11-14 16:08:50,752 - INFO - Finished converting document 4_2023-09-28 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-27' --> 'data\processed_data\CRM\4_2023-09-27.md'


2025-11-14 16:08:50,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,877 - INFO - Going to convert document batch...
2025-11-14 16:08:50,878 - INFO - Processing document 4_2023-09-29
2025-11-14 16:08:50,941 - INFO - Finished converting document 4_2023-09-29 in 0.11 sec.
2025-11-14 16:08:51,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,030 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-28' --> 'data\processed_data\CRM\4_2023-09-28.md'
Converted 'data\edgar_documents\CRM\4_2023-09-29' --> 'data\processed_data\CRM\4_2023-09-29.md'


2025-11-14 16:08:51,032 - INFO - Processing document 4_2023-10-02
2025-11-14 16:08:51,086 - INFO - Finished converting document 4_2023-10-02 in 0.09 sec.
2025-11-14 16:08:51,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,196 - INFO - Going to convert document batch...
2025-11-14 16:08:51,198 - INFO - Processing document 4_2023-10-03
2025-11-14 16:08:51,270 - INFO - Finished converting document 4_2023-10-03 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-02' --> 'data\processed_data\CRM\4_2023-10-02.md'
Converted 'data\edgar_documents\CRM\4_2023-10-03' --> 'data\processed_data\CRM\4_2023-10-03.md'


2025-11-14 16:08:51,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,420 - INFO - Going to convert document batch...
2025-11-14 16:08:51,421 - INFO - Processing document 4_2023-10-04
2025-11-14 16:08:51,492 - INFO - Finished converting document 4_2023-10-04 in 0.14 sec.
2025-11-14 16:08:51,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,621 - INFO - Going to convert document batch...
2025-11-14 16:08:51,622 - INFO - Processing document 4_2023-10-05
2025-11-14 16:08:51,666 - INFO - Finished converting document 4_2023-10-05 in 0.09 sec.
2025-11-14 16:08:51,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,744 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-04' --> 'data\processed_data\CRM\4_2023-10-04.md'
Converted 'data\edgar_documents\CRM\4_2023-10-05' --> 'data\processed_data\CRM\4_2023-10-05.md'


2025-11-14 16:08:51,745 - INFO - Processing document 4_2023-10-06
2025-11-14 16:08:51,798 - INFO - Finished converting document 4_2023-10-06 in 0.09 sec.
2025-11-14 16:08:51,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,896 - INFO - Going to convert document batch...
2025-11-14 16:08:51,897 - INFO - Processing document 4_2023-10-10
2025-11-14 16:08:51,945 - INFO - Finished converting document 4_2023-10-10 in 0.09 sec.
2025-11-14 16:08:52,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:52,046 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-06' --> 'data\processed_data\CRM\4_2023-10-06.md'
Converted 'data\edgar_documents\CRM\4_2023-10-10' --> 'data\processed_data\CRM\4_2023-10-10.md'


2025-11-14 16:08:52,047 - INFO - Processing document 4_2023-10-11
2025-11-14 16:08:52,103 - INFO - Finished converting document 4_2023-10-11 in 0.11 sec.
2025-11-14 16:08:52,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:52,190 - INFO - Going to convert document batch...
2025-11-14 16:08:52,191 - INFO - Processing document 4_2023-10-12
2025-11-14 16:08:52,242 - INFO - Finished converting document 4_2023-10-12 in 0.09 sec.
2025-11-14 16:08:52,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-11' --> 'data\processed_data\CRM\4_2023-10-11.md'
Converted 'data\edgar_documents\CRM\4_2023-10-12' --> 'data\processed_data\CRM\4_2023-10-12.md'


2025-11-14 16:08:52,381 - INFO - Going to convert document batch...
2025-11-14 16:08:52,383 - INFO - Processing document 4_2023-10-13
2025-11-14 16:08:53,097 - INFO - Finished converting document 4_2023-10-13 in 0.78 sec.
2025-11-14 16:08:53,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,237 - INFO - Going to convert document batch...
2025-11-14 16:08:53,239 - INFO - Processing document 4_2023-10-16
2025-11-14 16:08:53,309 - INFO - Finished converting document 4_2023-10-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-13' --> 'data\processed_data\CRM\4_2023-10-13.md'
Converted 'data\edgar_documents\CRM\4_2023-10-16' --> 'data\processed_data\CRM\4_2023-10-16.md'


2025-11-14 16:08:53,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,420 - INFO - Going to convert document batch...
2025-11-14 16:08:53,421 - INFO - Processing document 4_2023-10-17
2025-11-14 16:08:53,473 - INFO - Finished converting document 4_2023-10-17 in 0.11 sec.
2025-11-14 16:08:53,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,570 - INFO - Going to convert document batch...
2025-11-14 16:08:53,571 - INFO - Processing document 4_2023-10-18
2025-11-14 16:08:53,620 - INFO - Finished converting document 4_2023-10-18 in 0.09 sec.
2025-11-14 16:08:53,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-17' --> 'data\processed_data\CRM\4_2023-10-17.md'
Converted 'data\edgar_documents\CRM\4_2023-10-18' --> 'data\processed_data\CRM\4_2023-10-18.md'


2025-11-14 16:08:53,745 - INFO - Going to convert document batch...
2025-11-14 16:08:53,747 - INFO - Processing document 4_2023-10-19
2025-11-14 16:08:53,843 - INFO - Finished converting document 4_2023-10-19 in 0.16 sec.
2025-11-14 16:08:53,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,938 - INFO - Going to convert document batch...
2025-11-14 16:08:53,939 - INFO - Processing document 4_2023-10-20
2025-11-14 16:08:53,990 - INFO - Finished converting document 4_2023-10-20 in 0.09 sec.
2025-11-14 16:08:54,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,088 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-19' --> 'data\processed_data\CRM\4_2023-10-19.md'
Converted 'data\edgar_documents\CRM\4_2023-10-20' --> 'data\processed_data\CRM\4_2023-10-20.md'


2025-11-14 16:08:54,090 - INFO - Processing document 4_2023-10-23
2025-11-14 16:08:54,170 - INFO - Finished converting document 4_2023-10-23 in 0.12 sec.
2025-11-14 16:08:54,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,283 - INFO - Going to convert document batch...
2025-11-14 16:08:54,284 - INFO - Processing document 4_2023-10-24
2025-11-14 16:08:54,330 - INFO - Finished converting document 4_2023-10-24 in 0.09 sec.
2025-11-14 16:08:54,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,415 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-23' --> 'data\processed_data\CRM\4_2023-10-23.md'
Converted 'data\edgar_documents\CRM\4_2023-10-24' --> 'data\processed_data\CRM\4_2023-10-24.md'


2025-11-14 16:08:54,417 - INFO - Processing document 4_2023-10-25
2025-11-14 16:08:54,474 - INFO - Finished converting document 4_2023-10-25 in 0.09 sec.
2025-11-14 16:08:54,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,598 - INFO - Going to convert document batch...
2025-11-14 16:08:54,599 - INFO - Processing document 4_2023-10-26
2025-11-14 16:08:54,657 - INFO - Finished converting document 4_2023-10-26 in 0.11 sec.
2025-11-14 16:08:54,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-25' --> 'data\processed_data\CRM\4_2023-10-25.md'
Converted 'data\edgar_documents\CRM\4_2023-10-26' --> 'data\processed_data\CRM\4_2023-10-26.md'


2025-11-14 16:08:54,786 - INFO - Going to convert document batch...
2025-11-14 16:08:54,787 - INFO - Processing document 4_2023-10-27
2025-11-14 16:08:54,869 - INFO - Finished converting document 4_2023-10-27 in 0.16 sec.
2025-11-14 16:08:54,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,980 - INFO - Going to convert document batch...
2025-11-14 16:08:54,981 - INFO - Processing document 4_2023-10-30
2025-11-14 16:08:55,023 - INFO - Finished converting document 4_2023-10-30 in 0.08 sec.
2025-11-14 16:08:55,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-27' --> 'data\processed_data\CRM\4_2023-10-27.md'
Converted 'data\edgar_documents\CRM\4_2023-10-30' --> 'data\processed_data\CRM\4_2023-10-30.md'


2025-11-14 16:08:55,144 - INFO - Going to convert document batch...
2025-11-14 16:08:55,147 - INFO - Processing document 4_2023-10-31
2025-11-14 16:08:55,201 - INFO - Finished converting document 4_2023-10-31 in 0.11 sec.
2025-11-14 16:08:55,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,307 - INFO - Going to convert document batch...
2025-11-14 16:08:55,309 - INFO - Processing document 4_2023-11-01
2025-11-14 16:08:55,416 - INFO - Finished converting document 4_2023-11-01 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-31' --> 'data\processed_data\CRM\4_2023-10-31.md'


2025-11-14 16:08:55,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,561 - INFO - Going to convert document batch...
2025-11-14 16:08:55,565 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\CRM\4_2023-11-01' --> 'data\processed_data\CRM\4_2023-11-01.md'


2025-11-14 16:08:55,739 - INFO - Finished converting document 4_2023-11-02 in 0.23 sec.
2025-11-14 16:08:55,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,817 - INFO - Going to convert document batch...
2025-11-14 16:08:55,818 - INFO - Processing document 4_2023-11-03
2025-11-14 16:08:55,862 - INFO - Finished converting document 4_2023-11-03 in 0.08 sec.
2025-11-14 16:08:55,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,941 - INFO - Going to convert document batch...
2025-11-14 16:08:55,941 - INFO - Processing document 4_2023-11-06
2025-11-14 16:08:55,987 - INFO - Finished converting document 4_2023-11-06 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-02' --> 'data\processed_data\CRM\4_2023-11-02.md'
Converted 'data\edgar_documents\CRM\4_2023-11-03' --> 'data\processed_data\CRM\4_2023-11-03.md'


2025-11-14 16:08:56,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,067 - INFO - Going to convert document batch...
2025-11-14 16:08:56,069 - INFO - Processing document 4_2023-11-07
2025-11-14 16:08:56,158 - INFO - Finished converting document 4_2023-11-07 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-06' --> 'data\processed_data\CRM\4_2023-11-06.md'


2025-11-14 16:08:56,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,327 - INFO - Going to convert document batch...
2025-11-14 16:08:56,329 - INFO - Processing document 4_2023-11-08
2025-11-14 16:08:56,390 - INFO - Finished converting document 4_2023-11-08 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-07' --> 'data\processed_data\CRM\4_2023-11-07.md'


2025-11-14 16:08:56,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,566 - INFO - Going to convert document batch...
2025-11-14 16:08:56,567 - INFO - Processing document 4_2023-11-09
2025-11-14 16:08:56,629 - INFO - Finished converting document 4_2023-11-09 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-08' --> 'data\processed_data\CRM\4_2023-11-08.md'


2025-11-14 16:08:56,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,745 - INFO - Going to convert document batch...
2025-11-14 16:08:56,747 - INFO - Processing document 4_2023-11-13
2025-11-14 16:08:56,818 - INFO - Finished converting document 4_2023-11-13 in 0.12 sec.
2025-11-14 16:08:56,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-09' --> 'data\processed_data\CRM\4_2023-11-09.md'
Converted 'data\edgar_documents\CRM\4_2023-11-13' --> 'data\processed_data\CRM\4_2023-11-13.md'


2025-11-14 16:08:56,917 - INFO - Going to convert document batch...
2025-11-14 16:08:56,918 - INFO - Processing document 4_2023-11-14
2025-11-14 16:08:56,968 - INFO - Finished converting document 4_2023-11-14 in 0.11 sec.
2025-11-14 16:08:57,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,066 - INFO - Going to convert document batch...
2025-11-14 16:08:57,067 - INFO - Processing document 4_2023-11-15
2025-11-14 16:08:57,162 - INFO - Finished converting document 4_2023-11-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-14' --> 'data\processed_data\CRM\4_2023-11-14.md'


2025-11-14 16:08:57,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,316 - INFO - Going to convert document batch...
2025-11-14 16:08:57,318 - INFO - Processing document 4_2023-11-16
2025-11-14 16:08:57,395 - INFO - Finished converting document 4_2023-11-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-15' --> 'data\processed_data\CRM\4_2023-11-15.md'


2025-11-14 16:08:57,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,518 - INFO - Going to convert document batch...
2025-11-14 16:08:57,520 - INFO - Processing document 4_2023-11-17
2025-11-14 16:08:57,603 - INFO - Finished converting document 4_2023-11-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-16' --> 'data\processed_data\CRM\4_2023-11-16.md'
Converted 'data\edgar_documents\CRM\4_2023-11-17' --> 'data\processed_data\CRM\4_2023-11-17.md'


2025-11-14 16:08:57,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,718 - INFO - Going to convert document batch...
2025-11-14 16:08:57,720 - INFO - Processing document 4_2023-11-20
2025-11-14 16:08:57,790 - INFO - Finished converting document 4_2023-11-20 in 0.12 sec.
2025-11-14 16:08:57,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,936 - INFO - Going to convert document batch...
2025-11-14 16:08:57,939 - INFO - Processing document 4_2023-11-21
2025-11-14 16:08:58,003 - INFO - Finished converting document 4_2023-11-21 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-20' --> 'data\processed_data\CRM\4_2023-11-20.md'
Converted 'data\edgar_documents\CRM\4_2023-11-21' --> 'data\processed_data\CRM\4_2023-11-21.md'


2025-11-14 16:08:58,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,111 - INFO - Going to convert document batch...
2025-11-14 16:08:58,112 - INFO - Processing document 4_2023-11-22
2025-11-14 16:08:58,159 - INFO - Finished converting document 4_2023-11-22 in 0.11 sec.
2025-11-14 16:08:58,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,294 - INFO - Going to convert document batch...
2025-11-14 16:08:58,296 - INFO - Processing document 4_2023-11-24
2025-11-14 16:08:58,338 - INFO - Finished converting document 4_2023-11-24 in 0.12 sec.
2025-11-14 16:08:58,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-22' --> 'data\processed_data\CRM\4_2023-11-22.md'
Converted 'data\edgar_documents\CRM\4_2023-11-24' --> 'data\processed_data\CRM\4_2023-11-24.md'


2025-11-14 16:08:58,463 - INFO - Going to convert document batch...
2025-11-14 16:08:58,464 - INFO - Processing document 4_2023-11-27
2025-11-14 16:08:58,587 - INFO - Finished converting document 4_2023-11-27 in 0.20 sec.
2025-11-14 16:08:58,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,723 - INFO - Going to convert document batch...
2025-11-14 16:08:58,724 - INFO - Processing document 4_2023-11-28
2025-11-14 16:08:58,780 - INFO - Finished converting document 4_2023-11-28 in 0.11 sec.
2025-11-14 16:08:58,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,867 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-11-27' --> 'data\processed_data\CRM\4_2023-11-27.md'
Converted 'data\edgar_documents\CRM\4_2023-11-28' --> 'data\processed_data\CRM\4_2023-11-28.md'


2025-11-14 16:08:58,868 - INFO - Processing document 4_2023-11-29
2025-11-14 16:08:58,916 - INFO - Finished converting document 4_2023-11-29 in 0.09 sec.
2025-11-14 16:08:58,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,000 - INFO - Going to convert document batch...
2025-11-14 16:08:59,001 - INFO - Processing document 4_2023-11-30
2025-11-14 16:08:59,055 - INFO - Finished converting document 4_2023-11-30 in 0.09 sec.
2025-11-14 16:08:59,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-29' --> 'data\processed_data\CRM\4_2023-11-29.md'
Converted 'data\edgar_documents\CRM\4_2023-11-30' --> 'data\processed_data\CRM\4_2023-11-30.md'


2025-11-14 16:08:59,191 - INFO - Going to convert document batch...
2025-11-14 16:08:59,193 - INFO - Processing document 4_2023-12-01
2025-11-14 16:08:59,282 - INFO - Finished converting document 4_2023-12-01 in 0.17 sec.
2025-11-14 16:08:59,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,371 - INFO - Going to convert document batch...
2025-11-14 16:08:59,373 - INFO - Processing document 4_2023-12-04
2025-11-14 16:08:59,432 - INFO - Finished converting document 4_2023-12-04 in 0.11 sec.
2025-11-14 16:08:59,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,515 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-01' --> 'data\processed_data\CRM\4_2023-12-01.md'
Converted 'data\edgar_documents\CRM\4_2023-12-04' --> 'data\processed_data\CRM\4_2023-12-04.md'


2025-11-14 16:08:59,516 - INFO - Processing document 4_2023-12-05
2025-11-14 16:08:59,565 - INFO - Finished converting document 4_2023-12-05 in 0.09 sec.
2025-11-14 16:08:59,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,648 - INFO - Going to convert document batch...
2025-11-14 16:08:59,650 - INFO - Processing document 4_2023-12-06
2025-11-14 16:08:59,703 - INFO - Finished converting document 4_2023-12-06 in 0.09 sec.
2025-11-14 16:08:59,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,784 - INFO - Going to convert document batch...
2025-11-14 16:08:59,786 - INFO - Processing document 4_2023-12-07


Converted 'data\edgar_documents\CRM\4_2023-12-05' --> 'data\processed_data\CRM\4_2023-12-05.md'
Converted 'data\edgar_documents\CRM\4_2023-12-06' --> 'data\processed_data\CRM\4_2023-12-06.md'


2025-11-14 16:08:59,838 - INFO - Finished converting document 4_2023-12-07 in 0.09 sec.
2025-11-14 16:08:59,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-12-07' --> 'data\processed_data\CRM\4_2023-12-07.md'


2025-11-14 16:09:00,464 - INFO - Going to convert document batch...
2025-11-14 16:09:00,467 - INFO - Processing document 4_2023-12-08
2025-11-14 16:09:00,573 - INFO - Finished converting document 4_2023-12-08 in 0.69 sec.
2025-11-14 16:09:00,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:00,717 - INFO - Going to convert document batch...
2025-11-14 16:09:00,719 - INFO - Processing document 4_2023-12-11
2025-11-14 16:09:00,806 - INFO - Finished converting document 4_2023-12-11 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-08' --> 'data\processed_data\CRM\4_2023-12-08.md'


2025-11-14 16:09:00,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:00,945 - INFO - Going to convert document batch...
2025-11-14 16:09:00,947 - INFO - Processing document 4_2023-12-12
2025-11-14 16:09:01,030 - INFO - Finished converting document 4_2023-12-12 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-11' --> 'data\processed_data\CRM\4_2023-12-11.md'


2025-11-14 16:09:01,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,171 - INFO - Going to convert document batch...
2025-11-14 16:09:01,173 - INFO - Processing document 4_2023-12-13
2025-11-14 16:09:01,243 - INFO - Finished converting document 4_2023-12-13 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-12' --> 'data\processed_data\CRM\4_2023-12-12.md'


2025-11-14 16:09:01,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,350 - INFO - Going to convert document batch...
2025-11-14 16:09:01,351 - INFO - Processing document 4_2023-12-14
2025-11-14 16:09:01,403 - INFO - Finished converting document 4_2023-12-14 in 0.09 sec.
2025-11-14 16:09:01,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-12-13' --> 'data\processed_data\CRM\4_2023-12-13.md'
Converted 'data\edgar_documents\CRM\4_2023-12-14' --> 'data\processed_data\CRM\4_2023-12-14.md'


2025-11-14 16:09:01,523 - INFO - Going to convert document batch...
2025-11-14 16:09:01,526 - INFO - Processing document 4_2023-12-15
2025-11-14 16:09:01,603 - INFO - Finished converting document 4_2023-12-15 in 0.14 sec.
2025-11-14 16:09:01,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,691 - INFO - Going to convert document batch...
2025-11-14 16:09:01,693 - INFO - Processing document 4_2023-12-18
2025-11-14 16:09:01,747 - INFO - Finished converting document 4_2023-12-18 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-15' --> 'data\processed_data\CRM\4_2023-12-15.md'
Converted 'data\edgar_documents\CRM\4_2023-12-18' --> 'data\processed_data\CRM\4_2023-12-18.md'


2025-11-14 16:09:01,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,897 - INFO - Going to convert document batch...
2025-11-14 16:09:01,899 - INFO - Processing document 4_2023-12-19
2025-11-14 16:09:01,952 - INFO - Finished converting document 4_2023-12-19 in 0.14 sec.
2025-11-14 16:09:02,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,062 - INFO - Going to convert document batch...
2025-11-14 16:09:02,064 - INFO - Processing document 4_2023-12-20
2025-11-14 16:09:02,107 - INFO - Finished converting document 4_2023-12-20 in 0.09 sec.
2025-11-14 16:09:02,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,232 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-19' --> 'data\processed_data\CRM\4_2023-12-19.md'
Converted 'data\edgar_documents\CRM\4_2023-12-20' --> 'data\processed_data\CRM\4_2023-12-20.md'


2025-11-14 16:09:02,234 - INFO - Processing document 4_2023-12-21
2025-11-14 16:09:02,327 - INFO - Finished converting document 4_2023-12-21 in 0.17 sec.
2025-11-14 16:09:02,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,426 - INFO - Going to convert document batch...
2025-11-14 16:09:02,429 - INFO - Processing document 4_2023-12-22
2025-11-14 16:09:02,484 - INFO - Finished converting document 4_2023-12-22 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-21' --> 'data\processed_data\CRM\4_2023-12-21.md'
Converted 'data\edgar_documents\CRM\4_2023-12-22' --> 'data\processed_data\CRM\4_2023-12-22.md'


2025-11-14 16:09:02,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,637 - INFO - Going to convert document batch...
2025-11-14 16:09:02,638 - INFO - Processing document 4_2023-12-26
2025-11-14 16:09:02,720 - INFO - Finished converting document 4_2023-12-26 in 0.17 sec.
2025-11-14 16:09:02,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,864 - INFO - Going to convert document batch...
2025-11-14 16:09:02,867 - INFO - Processing document 4_2023-12-27
2025-11-14 16:09:02,948 - INFO - Finished converting document 4_2023-12-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-26' --> 'data\processed_data\CRM\4_2023-12-26.md'


2025-11-14 16:09:03,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,062 - INFO - Going to convert document batch...
2025-11-14 16:09:03,063 - INFO - Processing document 4_2023-12-28
2025-11-14 16:09:03,102 - INFO - Finished converting document 4_2023-12-28 in 0.08 sec.
2025-11-14 16:09:03,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,204 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-27' --> 'data\processed_data\CRM\4_2023-12-27.md'
Converted 'data\edgar_documents\CRM\4_2023-12-28' --> 'data\processed_data\CRM\4_2023-12-28.md'


2025-11-14 16:09:03,205 - INFO - Processing document 4_2023-12-29
2025-11-14 16:09:03,269 - INFO - Finished converting document 4_2023-12-29 in 0.12 sec.
2025-11-14 16:09:03,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,367 - INFO - Going to convert document batch...
2025-11-14 16:09:03,368 - INFO - Processing document 4_2024-01-03
2025-11-14 16:09:03,419 - INFO - Finished converting document 4_2024-01-03 in 0.09 sec.
2025-11-14 16:09:03,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,518 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-29' --> 'data\processed_data\CRM\4_2023-12-29.md'
Converted 'data\edgar_documents\CRM\4_2024-01-03' --> 'data\processed_data\CRM\4_2024-01-03.md'


2025-11-14 16:09:03,520 - INFO - Processing document 4_2024-01-04
2025-11-14 16:09:03,585 - INFO - Finished converting document 4_2024-01-04 in 0.11 sec.
2025-11-14 16:09:03,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,688 - INFO - Going to convert document batch...
2025-11-14 16:09:03,690 - INFO - Processing document 4_2024-01-05
2025-11-14 16:09:03,747 - INFO - Finished converting document 4_2024-01-05 in 0.11 sec.
2025-11-14 16:09:03,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-04' --> 'data\processed_data\CRM\4_2024-01-04.md'
Converted 'data\edgar_documents\CRM\4_2024-01-05' --> 'data\processed_data\CRM\4_2024-01-05.md'


2025-11-14 16:09:03,876 - INFO - Going to convert document batch...
2025-11-14 16:09:03,877 - INFO - Processing document 4_2024-01-08
2025-11-14 16:09:03,946 - INFO - Finished converting document 4_2024-01-08 in 0.14 sec.
2025-11-14 16:09:04,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,025 - INFO - Going to convert document batch...
2025-11-14 16:09:04,026 - INFO - Processing document 4_2024-01-09
2025-11-14 16:09:04,111 - INFO - Finished converting document 4_2024-01-09 in 0.12 sec.
2025-11-14 16:09:04,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-08' --> 'data\processed_data\CRM\4_2024-01-08.md'
Converted 'data\edgar_documents\CRM\4_2024-01-09' --> 'data\processed_data\CRM\4_2024-01-09.md'


2025-11-14 16:09:04,205 - INFO - Going to convert document batch...
2025-11-14 16:09:04,207 - INFO - Processing document 4_2024-01-10
2025-11-14 16:09:04,266 - INFO - Finished converting document 4_2024-01-10 in 0.11 sec.
2025-11-14 16:09:04,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,376 - INFO - Going to convert document batch...
2025-11-14 16:09:04,378 - INFO - Processing document 4_2024-01-11
2025-11-14 16:09:04,450 - INFO - Finished converting document 4_2024-01-11 in 0.12 sec.
2025-11-14 16:09:04,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-10' --> 'data\processed_data\CRM\4_2024-01-10.md'
Converted 'data\edgar_documents\CRM\4_2024-01-11' --> 'data\processed_data\CRM\4_2024-01-11.md'


2025-11-14 16:09:04,549 - INFO - Going to convert document batch...
2025-11-14 16:09:04,550 - INFO - Processing document 4_2024-01-12
2025-11-14 16:09:04,612 - INFO - Finished converting document 4_2024-01-12 in 0.11 sec.
2025-11-14 16:09:04,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,701 - INFO - Going to convert document batch...
2025-11-14 16:09:04,702 - INFO - Processing document 4_2024-01-16
2025-11-14 16:09:04,760 - INFO - Finished converting document 4_2024-01-16 in 0.11 sec.
2025-11-14 16:09:04,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,852 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-01-12' --> 'data\processed_data\CRM\4_2024-01-12.md'
Converted 'data\edgar_documents\CRM\4_2024-01-16' --> 'data\processed_data\CRM\4_2024-01-16.md'


2025-11-14 16:09:04,855 - INFO - Processing document 4_2024-01-17
2025-11-14 16:09:04,908 - INFO - Finished converting document 4_2024-01-17 in 0.09 sec.
2025-11-14 16:09:05,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,053 - INFO - Going to convert document batch...
2025-11-14 16:09:05,054 - INFO - Processing document 4_2024-01-18
2025-11-14 16:09:05,136 - INFO - Finished converting document 4_2024-01-18 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-01-17' --> 'data\processed_data\CRM\4_2024-01-17.md'


2025-11-14 16:09:05,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,261 - INFO - Going to convert document batch...
2025-11-14 16:09:05,262 - INFO - Processing document 4_2024-01-19
2025-11-14 16:09:05,316 - INFO - Finished converting document 4_2024-01-19 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-01-18' --> 'data\processed_data\CRM\4_2024-01-18.md'
Converted 'data\edgar_documents\CRM\4_2024-01-19' --> 'data\processed_data\CRM\4_2024-01-19.md'


2025-11-14 16:09:05,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,453 - INFO - Going to convert document batch...
2025-11-14 16:09:05,455 - INFO - Processing document 4_2024-01-22
2025-11-14 16:09:05,505 - INFO - Finished converting document 4_2024-01-22 in 0.11 sec.
2025-11-14 16:09:05,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,599 - INFO - Going to convert document batch...
2025-11-14 16:09:05,600 - INFO - Processing document 4_2024-01-23
2025-11-14 16:09:05,664 - INFO - Finished converting document 4_2024-01-23 in 0.11 sec.
2025-11-14 16:09:05,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-22' --> 'data\processed_data\CRM\4_2024-01-22.md'
Converted 'data\edgar_documents\CRM\4_2024-01-23' --> 'data\processed_data\CRM\4_2024-01-23.md'


2025-11-14 16:09:05,759 - INFO - Going to convert document batch...
2025-11-14 16:09:05,760 - INFO - Processing document 4_2024-01-24
2025-11-14 16:09:05,835 - INFO - Finished converting document 4_2024-01-24 in 0.12 sec.
2025-11-14 16:09:05,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,922 - INFO - Going to convert document batch...
2025-11-14 16:09:05,924 - INFO - Processing document 4_2024-01-25
2025-11-14 16:09:05,970 - INFO - Finished converting document 4_2024-01-25 in 0.08 sec.
2025-11-14 16:09:06,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,069 - INFO - Going to convert document batch...
2025-11-14 16:09:06,070 - INFO - Processing document 4_2024-01-26


Converted 'data\edgar_documents\CRM\4_2024-01-24' --> 'data\processed_data\CRM\4_2024-01-24.md'
Converted 'data\edgar_documents\CRM\4_2024-01-25' --> 'data\processed_data\CRM\4_2024-01-25.md'


2025-11-14 16:09:06,113 - INFO - Finished converting document 4_2024-01-26 in 0.08 sec.
2025-11-14 16:09:06,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,196 - INFO - Going to convert document batch...
2025-11-14 16:09:06,197 - INFO - Processing document 4_2024-01-29
2025-11-14 16:09:06,258 - INFO - Finished converting document 4_2024-01-29 in 0.09 sec.
2025-11-14 16:09:06,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-26' --> 'data\processed_data\CRM\4_2024-01-26.md'
Converted 'data\edgar_documents\CRM\4_2024-01-29' --> 'data\processed_data\CRM\4_2024-01-29.md'


2025-11-14 16:09:06,369 - INFO - Going to convert document batch...
2025-11-14 16:09:06,371 - INFO - Processing document 4_2024-01-30
2025-11-14 16:09:06,422 - INFO - Finished converting document 4_2024-01-30 in 0.11 sec.
2025-11-14 16:09:06,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,513 - INFO - Going to convert document batch...
2025-11-14 16:09:06,514 - INFO - Processing document 4_2024-01-31
2025-11-14 16:09:06,576 - INFO - Finished converting document 4_2024-01-31 in 0.11 sec.
2025-11-14 16:09:06,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-30' --> 'data\processed_data\CRM\4_2024-01-30.md'
Converted 'data\edgar_documents\CRM\4_2024-01-31' --> 'data\processed_data\CRM\4_2024-01-31.md'


2025-11-14 16:09:06,682 - INFO - Going to convert document batch...
2025-11-14 16:09:06,685 - INFO - Processing document 4_2024-02-01
2025-11-14 16:09:06,743 - INFO - Finished converting document 4_2024-02-01 in 0.11 sec.
2025-11-14 16:09:06,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,827 - INFO - Going to convert document batch...
2025-11-14 16:09:06,829 - INFO - Processing document 4_2024-02-02
2025-11-14 16:09:06,893 - INFO - Finished converting document 4_2024-02-02 in 0.11 sec.
2025-11-14 16:09:06,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-01' --> 'data\processed_data\CRM\4_2024-02-01.md'
Converted 'data\edgar_documents\CRM\4_2024-02-02' --> 'data\processed_data\CRM\4_2024-02-02.md'


2025-11-14 16:09:07,007 - INFO - Going to convert document batch...
2025-11-14 16:09:07,009 - INFO - Processing document 4_2024-02-05
2025-11-14 16:09:07,088 - INFO - Finished converting document 4_2024-02-05 in 0.16 sec.
2025-11-14 16:09:07,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:07,210 - INFO - Going to convert document batch...
2025-11-14 16:09:07,211 - INFO - Processing document 4_2024-02-06


Converted 'data\edgar_documents\CRM\4_2024-02-05' --> 'data\processed_data\CRM\4_2024-02-05.md'


2025-11-14 16:09:07,837 - INFO - Finished converting document 4_2024-02-06 in 0.67 sec.
2025-11-14 16:09:07,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:07,935 - INFO - Going to convert document batch...
2025-11-14 16:09:07,936 - INFO - Processing document 4_2024-02-07
2025-11-14 16:09:07,994 - INFO - Finished converting document 4_2024-02-07 in 0.09 sec.
2025-11-14 16:09:08,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,085 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-02-06' --> 'data\processed_data\CRM\4_2024-02-06.md'
Converted 'data\edgar_documents\CRM\4_2024-02-07' --> 'data\processed_data\CRM\4_2024-02-07.md'


2025-11-14 16:09:08,086 - INFO - Processing document 4_2024-02-08
2025-11-14 16:09:08,139 - INFO - Finished converting document 4_2024-02-08 in 0.09 sec.
2025-11-14 16:09:08,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,250 - INFO - Going to convert document batch...
2025-11-14 16:09:08,251 - INFO - Processing document 4_2024-02-09
2025-11-14 16:09:08,298 - INFO - Finished converting document 4_2024-02-09 in 0.09 sec.
2025-11-14 16:09:08,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-08' --> 'data\processed_data\CRM\4_2024-02-08.md'
Converted 'data\edgar_documents\CRM\4_2024-02-09' --> 'data\processed_data\CRM\4_2024-02-09.md'


2025-11-14 16:09:08,408 - INFO - Going to convert document batch...
2025-11-14 16:09:08,411 - INFO - Processing document 4_2024-02-12
2025-11-14 16:09:08,473 - INFO - Finished converting document 4_2024-02-12 in 0.12 sec.
2025-11-14 16:09:08,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,558 - INFO - Going to convert document batch...
2025-11-14 16:09:08,562 - INFO - Processing document 4_2024-02-13
2025-11-14 16:09:08,613 - INFO - Finished converting document 4_2024-02-13 in 0.09 sec.
2025-11-14 16:09:08,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-12' --> 'data\processed_data\CRM\4_2024-02-12.md'
Converted 'data\edgar_documents\CRM\4_2024-02-13' --> 'data\processed_data\CRM\4_2024-02-13.md'


2025-11-14 16:09:08,754 - INFO - Going to convert document batch...
2025-11-14 16:09:08,757 - INFO - Processing document 4_2024-02-14
2025-11-14 16:09:08,849 - INFO - Finished converting document 4_2024-02-14 in 0.17 sec.
2025-11-14 16:09:08,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,987 - INFO - Going to convert document batch...
2025-11-14 16:09:08,989 - INFO - Processing document 4_2024-02-15
2025-11-14 16:09:09,077 - INFO - Finished converting document 4_2024-02-15 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-02-14' --> 'data\processed_data\CRM\4_2024-02-14.md'
Converted 'data\edgar_documents\CRM\4_2024-02-15' --> 'data\processed_data\CRM\4_2024-02-15.md'


2025-11-14 16:09:09,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,178 - INFO - Going to convert document batch...
2025-11-14 16:09:09,179 - INFO - Processing document 4_2024-02-16
2025-11-14 16:09:09,234 - INFO - Finished converting document 4_2024-02-16 in 0.11 sec.
2025-11-14 16:09:09,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,346 - INFO - Going to convert document batch...
2025-11-14 16:09:09,347 - INFO - Processing document 4_2024-02-20
2025-11-14 16:09:09,398 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 16:09:09,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-16' --> 'data\processed_data\CRM\4_2024-02-16.md'
Converted 'data\edgar_documents\CRM\4_2024-02-20' --> 'data\processed_data\CRM\4_2024-02-20.md'


2025-11-14 16:09:09,490 - INFO - Going to convert document batch...
2025-11-14 16:09:09,492 - INFO - Processing document 4_2024-02-21
2025-11-14 16:09:09,559 - INFO - Finished converting document 4_2024-02-21 in 0.12 sec.
2025-11-14 16:09:09,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,650 - INFO - Going to convert document batch...
2025-11-14 16:09:09,652 - INFO - Processing document 4_2024-02-22
2025-11-14 16:09:09,734 - INFO - Finished converting document 4_2024-02-22 in 0.12 sec.
2025-11-14 16:09:09,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-21' --> 'data\processed_data\CRM\4_2024-02-21.md'
Converted 'data\edgar_documents\CRM\4_2024-02-22' --> 'data\processed_data\CRM\4_2024-02-22.md'


2025-11-14 16:09:09,828 - INFO - Going to convert document batch...
2025-11-14 16:09:09,829 - INFO - Processing document 4_2024-02-23
2025-11-14 16:09:09,869 - INFO - Finished converting document 4_2024-02-23 in 0.08 sec.
2025-11-14 16:09:09,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,948 - INFO - Going to convert document batch...
2025-11-14 16:09:09,949 - INFO - Processing document 4_2024-02-26
2025-11-14 16:09:10,015 - INFO - Finished converting document 4_2024-02-26 in 0.11 sec.
2025-11-14 16:09:10,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-23' --> 'data\processed_data\CRM\4_2024-02-23.md'
Converted 'data\edgar_documents\CRM\4_2024-02-26' --> 'data\processed_data\CRM\4_2024-02-26.md'


2025-11-14 16:09:10,107 - INFO - Going to convert document batch...
2025-11-14 16:09:10,109 - INFO - Processing document 4_2024-02-27
2025-11-14 16:09:10,156 - INFO - Finished converting document 4_2024-02-27 in 0.08 sec.
2025-11-14 16:09:10,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,235 - INFO - Going to convert document batch...
2025-11-14 16:09:10,236 - INFO - Processing document 4_2024-02-28
2025-11-14 16:09:10,304 - INFO - Finished converting document 4_2024-02-28 in 0.09 sec.
2025-11-14 16:09:10,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-27' --> 'data\processed_data\CRM\4_2024-02-27.md'
Converted 'data\edgar_documents\CRM\4_2024-02-28' --> 'data\processed_data\CRM\4_2024-02-28.md'


2025-11-14 16:09:10,392 - INFO - Going to convert document batch...
2025-11-14 16:09:10,394 - INFO - Processing document 4_2024-02-29
2025-11-14 16:09:10,469 - INFO - Finished converting document 4_2024-02-29 in 0.12 sec.
2025-11-14 16:09:10,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,596 - INFO - Going to convert document batch...
2025-11-14 16:09:10,597 - INFO - Processing document 4_2024-03-01
2025-11-14 16:09:10,724 - INFO - Finished converting document 4_2024-03-01 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2024-02-29' --> 'data\processed_data\CRM\4_2024-02-29.md'


2025-11-14 16:09:10,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,863 - INFO - Going to convert document batch...
2025-11-14 16:09:10,865 - INFO - Processing document 4_2024-03-04
2025-11-14 16:09:10,949 - INFO - Finished converting document 4_2024-03-04 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-01' --> 'data\processed_data\CRM\4_2024-03-01.md'


2025-11-14 16:09:11,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,080 - INFO - Going to convert document batch...
2025-11-14 16:09:11,081 - INFO - Processing document 4_2024-03-05
2025-11-14 16:09:11,133 - INFO - Finished converting document 4_2024-03-05 in 0.09 sec.
2025-11-14 16:09:11,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-04' --> 'data\processed_data\CRM\4_2024-03-04.md'
Converted 'data\edgar_documents\CRM\4_2024-03-05' --> 'data\processed_data\CRM\4_2024-03-05.md'


2025-11-14 16:09:11,249 - INFO - Going to convert document batch...
2025-11-14 16:09:11,250 - INFO - Processing document 4_2024-03-06
2025-11-14 16:09:11,379 - INFO - Finished converting document 4_2024-03-06 in 0.20 sec.
2025-11-14 16:09:11,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,574 - INFO - Going to convert document batch...
2025-11-14 16:09:11,577 - INFO - Processing document 4_2024-03-07
2025-11-14 16:09:11,628 - INFO - Finished converting document 4_2024-03-07 in 0.11 sec.
2025-11-14 16:09:11,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,717 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-03-06' --> 'data\processed_data\CRM\4_2024-03-06.md'
Converted 'data\edgar_documents\CRM\4_2024-03-07' --> 'data\processed_data\CRM\4_2024-03-07.md'


2025-11-14 16:09:11,718 - INFO - Processing document 4_2024-03-08
2025-11-14 16:09:11,775 - INFO - Finished converting document 4_2024-03-08 in 0.09 sec.
2025-11-14 16:09:11,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,859 - INFO - Going to convert document batch...
2025-11-14 16:09:11,859 - INFO - Processing document 4_2024-03-11
2025-11-14 16:09:11,922 - INFO - Finished converting document 4_2024-03-11 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-08' --> 'data\processed_data\CRM\4_2024-03-08.md'


2025-11-14 16:09:12,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,051 - INFO - Going to convert document batch...
2025-11-14 16:09:12,054 - INFO - Processing document 4_2024-03-12
2025-11-14 16:09:12,119 - INFO - Finished converting document 4_2024-03-12 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-11' --> 'data\processed_data\CRM\4_2024-03-11.md'
Converted 'data\edgar_documents\CRM\4_2024-03-12' --> 'data\processed_data\CRM\4_2024-03-12.md'


2025-11-14 16:09:12,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,259 - INFO - Going to convert document batch...
2025-11-14 16:09:12,260 - INFO - Processing document 4_2024-03-13
2025-11-14 16:09:12,439 - INFO - Finished converting document 4_2024-03-13 in 0.27 sec.
2025-11-14 16:09:12,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,535 - INFO - Going to convert document batch...
2025-11-14 16:09:12,536 - INFO - Processing document 4_2024-03-14
2025-11-14 16:09:12,581 - INFO - Finished converting document 4_2024-03-14 in 0.09 sec.
2025-11-14 16:09:12,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-03-13' --> 'data\processed_data\CRM\4_2024-03-13.md'
Converted 'data\edgar_documents\CRM\4_2024-03-14' --> 'data\processed_data\CRM\4_2024-03-14.md'


2025-11-14 16:09:12,683 - INFO - Processing document 4_2024-03-15
2025-11-14 16:09:12,745 - INFO - Finished converting document 4_2024-03-15 in 0.12 sec.
2025-11-14 16:09:12,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,851 - INFO - Going to convert document batch...
2025-11-14 16:09:12,853 - INFO - Processing document 4_2024-03-18
2025-11-14 16:09:12,917 - INFO - Finished converting document 4_2024-03-18 in 0.12 sec.
2025-11-14 16:09:12,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-15' --> 'data\processed_data\CRM\4_2024-03-15.md'
Converted 'data\edgar_documents\CRM\4_2024-03-18' --> 'data\processed_data\CRM\4_2024-03-18.md'


2025-11-14 16:09:13,014 - INFO - Going to convert document batch...
2025-11-14 16:09:13,016 - INFO - Processing document 4_2024-03-19
2025-11-14 16:09:13,069 - INFO - Finished converting document 4_2024-03-19 in 0.09 sec.
2025-11-14 16:09:13,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,167 - INFO - Going to convert document batch...
2025-11-14 16:09:13,168 - INFO - Processing document 4_2024-03-20
2025-11-14 16:09:13,240 - INFO - Finished converting document 4_2024-03-20 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-19' --> 'data\processed_data\CRM\4_2024-03-19.md'
Converted 'data\edgar_documents\CRM\4_2024-03-20' --> 'data\processed_data\CRM\4_2024-03-20.md'


2025-11-14 16:09:13,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,348 - INFO - Going to convert document batch...
2025-11-14 16:09:13,350 - INFO - Processing document 4_2024-03-21
2025-11-14 16:09:13,400 - INFO - Finished converting document 4_2024-03-21 in 0.09 sec.
2025-11-14 16:09:13,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,598 - INFO - Going to convert document batch...
2025-11-14 16:09:13,599 - INFO - Processing document 4_2024-03-22
2025-11-14 16:09:13,639 - INFO - Finished converting document 4_2024-03-22 in 0.12 sec.
2025-11-14 16:09:13,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-21' --> 'data\processed_data\CRM\4_2024-03-21.md'
Converted 'data\edgar_documents\CRM\4_2024-03-22' --> 'data\processed_data\CRM\4_2024-03-22.md'


2025-11-14 16:09:13,742 - INFO - Going to convert document batch...
2025-11-14 16:09:13,745 - INFO - Processing document 4_2024-03-25
2025-11-14 16:09:13,816 - INFO - Finished converting document 4_2024-03-25 in 0.14 sec.
2025-11-14 16:09:13,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,899 - INFO - Going to convert document batch...
2025-11-14 16:09:13,900 - INFO - Processing document 4_2024-03-26
2025-11-14 16:09:13,974 - INFO - Finished converting document 4_2024-03-26 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-25' --> 'data\processed_data\CRM\4_2024-03-25.md'


2025-11-14 16:09:14,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-26' --> 'data\processed_data\CRM\4_2024-03-26.md'


2025-11-14 16:09:14,661 - INFO - Going to convert document batch...
2025-11-14 16:09:14,662 - INFO - Processing document 4_2024-03-27
2025-11-14 16:09:14,737 - INFO - Finished converting document 4_2024-03-27 in 0.67 sec.
2025-11-14 16:09:14,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:14,830 - INFO - Going to convert document batch...
2025-11-14 16:09:14,831 - INFO - Processing document 4_2024-03-28
2025-11-14 16:09:14,902 - INFO - Finished converting document 4_2024-03-28 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-27' --> 'data\processed_data\CRM\4_2024-03-27.md'


2025-11-14 16:09:14,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,010 - INFO - Going to convert document batch...
2025-11-14 16:09:15,011 - INFO - Processing document 4_2024-03-29
2025-11-14 16:09:15,055 - INFO - Finished converting document 4_2024-03-29 in 0.08 sec.
2025-11-14 16:09:15,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,148 - INFO - Going to convert document batch...
2025-11-14 16:09:15,150 - INFO - Processing document 4_2024-04-02


Converted 'data\edgar_documents\CRM\4_2024-03-28' --> 'data\processed_data\CRM\4_2024-03-28.md'
Converted 'data\edgar_documents\CRM\4_2024-03-29' --> 'data\processed_data\CRM\4_2024-03-29.md'


2025-11-14 16:09:15,229 - INFO - Finished converting document 4_2024-04-02 in 0.14 sec.
2025-11-14 16:09:15,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,345 - INFO - Going to convert document batch...
2025-11-14 16:09:15,346 - INFO - Processing document 4_2024-04-03
2025-11-14 16:09:15,431 - INFO - Finished converting document 4_2024-04-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-02' --> 'data\processed_data\CRM\4_2024-04-02.md'


2025-11-14 16:09:15,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,550 - INFO - Going to convert document batch...
2025-11-14 16:09:15,551 - INFO - Processing document 4_2024-04-04
2025-11-14 16:09:15,636 - INFO - Finished converting document 4_2024-04-04 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-03' --> 'data\processed_data\CRM\4_2024-04-03.md'
Converted 'data\edgar_documents\CRM\4_2024-04-04' --> 'data\processed_data\CRM\4_2024-04-04.md'


2025-11-14 16:09:15,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,770 - INFO - Going to convert document batch...
2025-11-14 16:09:15,772 - INFO - Processing document 4_2024-04-05
2025-11-14 16:09:15,861 - INFO - Finished converting document 4_2024-04-05 in 0.16 sec.
2025-11-14 16:09:15,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,052 - INFO - Going to convert document batch...
2025-11-14 16:09:16,055 - INFO - Processing document 4_2024-04-08
2025-11-14 16:09:16,155 - INFO - Finished converting document 4_2024-04-08 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-05' --> 'data\processed_data\CRM\4_2024-04-05.md'


2025-11-14 16:09:16,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,254 - INFO - Going to convert document batch...
2025-11-14 16:09:16,255 - INFO - Processing document 4_2024-04-09
2025-11-14 16:09:16,312 - INFO - Finished converting document 4_2024-04-09 in 0.09 sec.
2025-11-14 16:09:16,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,395 - INFO - Going to convert document batch...
2025-11-14 16:09:16,396 - INFO - Processing document 4_2024-04-10


Converted 'data\edgar_documents\CRM\4_2024-04-08' --> 'data\processed_data\CRM\4_2024-04-08.md'
Converted 'data\edgar_documents\CRM\4_2024-04-09' --> 'data\processed_data\CRM\4_2024-04-09.md'


2025-11-14 16:09:16,429 - INFO - Finished converting document 4_2024-04-10 in 0.06 sec.
2025-11-14 16:09:16,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,528 - INFO - Going to convert document batch...
2025-11-14 16:09:16,529 - INFO - Processing document 4_2024-04-11
2025-11-14 16:09:16,576 - INFO - Finished converting document 4_2024-04-11 in 0.11 sec.
2025-11-14 16:09:16,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,666 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-04-10' --> 'data\processed_data\CRM\4_2024-04-10.md'
Converted 'data\edgar_documents\CRM\4_2024-04-11' --> 'data\processed_data\CRM\4_2024-04-11.md'


2025-11-14 16:09:16,668 - INFO - Processing document 4_2024-04-12
2025-11-14 16:09:16,730 - INFO - Finished converting document 4_2024-04-12 in 0.11 sec.
2025-11-14 16:09:16,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,898 - INFO - Going to convert document batch...
2025-11-14 16:09:16,899 - INFO - Processing document 4_2024-04-15
2025-11-14 16:09:16,955 - INFO - Finished converting document 4_2024-04-15 in 0.12 sec.
2025-11-14 16:09:17,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-04-12' --> 'data\processed_data\CRM\4_2024-04-12.md'
Converted 'data\edgar_documents\CRM\4_2024-04-15' --> 'data\processed_data\CRM\4_2024-04-15.md'


2025-11-14 16:09:17,099 - INFO - Going to convert document batch...
2025-11-14 16:09:17,100 - INFO - Processing document 4_2024-04-16
2025-11-14 16:09:17,222 - INFO - Finished converting document 4_2024-04-16 in 0.22 sec.
2025-11-14 16:09:17,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,362 - INFO - Going to convert document batch...
2025-11-14 16:09:17,364 - INFO - Processing document 4_2024-04-17
2025-11-14 16:09:17,432 - INFO - Finished converting document 4_2024-04-17 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-16' --> 'data\processed_data\CRM\4_2024-04-16.md'
Converted 'data\edgar_documents\CRM\4_2024-04-17' --> 'data\processed_data\CRM\4_2024-04-17.md'


2025-11-14 16:09:17,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,567 - INFO - Going to convert document batch...
2025-11-14 16:09:17,570 - INFO - Processing document 4_2024-04-18
2025-11-14 16:09:17,671 - INFO - Finished converting document 4_2024-04-18 in 0.17 sec.
2025-11-14 16:09:17,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,818 - INFO - Going to convert document batch...
2025-11-14 16:09:17,820 - INFO - Processing document 4_2024-04-19
2025-11-14 16:09:17,895 - INFO - Finished converting document 4_2024-04-19 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-18' --> 'data\processed_data\CRM\4_2024-04-18.md'
Converted 'data\edgar_documents\CRM\4_2024-04-19' --> 'data\processed_data\CRM\4_2024-04-19.md'


2025-11-14 16:09:17,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,993 - INFO - Going to convert document batch...
2025-11-14 16:09:17,994 - INFO - Processing document 4_2024-04-22
2025-11-14 16:09:18,043 - INFO - Finished converting document 4_2024-04-22 in 0.09 sec.
2025-11-14 16:09:18,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,178 - INFO - Going to convert document batch...
2025-11-14 16:09:18,179 - INFO - Processing document 4_2024-04-23
2025-11-14 16:09:18,281 - INFO - Finished converting document 4_2024-04-23 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-22' --> 'data\processed_data\CRM\4_2024-04-22.md'


2025-11-14 16:09:18,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,416 - INFO - Going to convert document batch...
2025-11-14 16:09:18,417 - INFO - Processing document 4_2024-04-24
2025-11-14 16:09:18,494 - INFO - Finished converting document 4_2024-04-24 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-23' --> 'data\processed_data\CRM\4_2024-04-23.md'
Converted 'data\edgar_documents\CRM\4_2024-04-24' --> 'data\processed_data\CRM\4_2024-04-24.md'


2025-11-14 16:09:18,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,602 - INFO - Going to convert document batch...
2025-11-14 16:09:18,603 - INFO - Processing document 4_2024-04-25
2025-11-14 16:09:18,638 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 16:09:18,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,706 - INFO - Going to convert document batch...
2025-11-14 16:09:18,708 - INFO - Processing document 4_2024-04-26
2025-11-14 16:09:18,756 - INFO - Finished converting document 4_2024-04-26 in 0.08 sec.
2025-11-14 16:09:18,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,865 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-04-25' --> 'data\processed_data\CRM\4_2024-04-25.md'
Converted 'data\edgar_documents\CRM\4_2024-04-26' --> 'data\processed_data\CRM\4_2024-04-26.md'


2025-11-14 16:09:18,867 - INFO - Processing document 4_2024-04-29
2025-11-14 16:09:18,916 - INFO - Finished converting document 4_2024-04-29 in 0.09 sec.
2025-11-14 16:09:18,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,005 - INFO - Going to convert document batch...
2025-11-14 16:09:19,006 - INFO - Processing document 4_2024-04-30
2025-11-14 16:09:19,072 - INFO - Finished converting document 4_2024-04-30 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-29' --> 'data\processed_data\CRM\4_2024-04-29.md'
Converted 'data\edgar_documents\CRM\4_2024-04-30' --> 'data\processed_data\CRM\4_2024-04-30.md'


2025-11-14 16:09:19,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,248 - INFO - Going to convert document batch...
2025-11-14 16:09:19,249 - INFO - Processing document 4_2024-05-01
2025-11-14 16:09:19,367 - INFO - Finished converting document 4_2024-05-01 in 0.20 sec.
2025-11-14 16:09:19,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,541 - INFO - Going to convert document batch...
2025-11-14 16:09:19,542 - INFO - Processing document 4_2024-05-02
2025-11-14 16:09:19,598 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 16:09:19,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,694 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-05-01' --> 'data\processed_data\CRM\4_2024-05-01.md'
Converted 'data\edgar_documents\CRM\4_2024-05-02' --> 'data\processed_data\CRM\4_2024-05-02.md'


2025-11-14 16:09:19,695 - INFO - Processing document 4_2024-05-03
2025-11-14 16:09:19,750 - INFO - Finished converting document 4_2024-05-03 in 0.11 sec.
2025-11-14 16:09:19,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,841 - INFO - Going to convert document batch...
2025-11-14 16:09:19,842 - INFO - Processing document 4_2024-05-06
2025-11-14 16:09:19,900 - INFO - Finished converting document 4_2024-05-06 in 0.09 sec.
2025-11-14 16:09:19,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,981 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-05-03' --> 'data\processed_data\CRM\4_2024-05-03.md'
Converted 'data\edgar_documents\CRM\4_2024-05-06' --> 'data\processed_data\CRM\4_2024-05-06.md'


2025-11-14 16:09:19,982 - INFO - Processing document 4_2024-05-07
2025-11-14 16:09:20,027 - INFO - Finished converting document 4_2024-05-07 in 0.08 sec.
2025-11-14 16:09:20,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,126 - INFO - Going to convert document batch...
2025-11-14 16:09:20,127 - INFO - Processing document 4_2024-05-08
2025-11-14 16:09:20,280 - INFO - Finished converting document 4_2024-05-08 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-07' --> 'data\processed_data\CRM\4_2024-05-07.md'


2025-11-14 16:09:20,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,367 - INFO - Going to convert document batch...
2025-11-14 16:09:20,369 - INFO - Processing document 4_2024-05-09
2025-11-14 16:09:20,413 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.
2025-11-14 16:09:20,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,509 - INFO - Going to convert document batch...
2025-11-14 16:09:20,510 - INFO - Processing document 4_2024-05-10


Converted 'data\edgar_documents\CRM\4_2024-05-08' --> 'data\processed_data\CRM\4_2024-05-08.md'
Converted 'data\edgar_documents\CRM\4_2024-05-09' --> 'data\processed_data\CRM\4_2024-05-09.md'


2025-11-14 16:09:20,567 - INFO - Finished converting document 4_2024-05-10 in 0.11 sec.
2025-11-14 16:09:20,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,664 - INFO - Going to convert document batch...
2025-11-14 16:09:20,665 - INFO - Processing document 4_2024-05-13
2025-11-14 16:09:20,715 - INFO - Finished converting document 4_2024-05-13 in 0.09 sec.
2025-11-14 16:09:20,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,800 - INFO - Going to convert document batch...
2025-11-14 16:09:20,801 - INFO - Processing document 4_2024-05-14


Converted 'data\edgar_documents\CRM\4_2024-05-10' --> 'data\processed_data\CRM\4_2024-05-10.md'
Converted 'data\edgar_documents\CRM\4_2024-05-13' --> 'data\processed_data\CRM\4_2024-05-13.md'


2025-11-14 16:09:20,856 - INFO - Finished converting document 4_2024-05-14 in 0.11 sec.
2025-11-14 16:09:20,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,990 - INFO - Going to convert document batch...
2025-11-14 16:09:20,992 - INFO - Processing document 4_2024-05-15
2025-11-14 16:09:21,058 - INFO - Finished converting document 4_2024-05-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-14' --> 'data\processed_data\CRM\4_2024-05-14.md'
Converted 'data\edgar_documents\CRM\4_2024-05-15' --> 'data\processed_data\CRM\4_2024-05-15.md'


2025-11-14 16:09:21,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:21,158 - INFO - Going to convert document batch...
2025-11-14 16:09:21,160 - INFO - Processing document 4_2024-05-16
2025-11-14 16:09:21,200 - INFO - Finished converting document 4_2024-05-16 in 0.09 sec.
2025-11-14 16:09:21,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-16' --> 'data\processed_data\CRM\4_2024-05-16.md'


2025-11-14 16:09:21,933 - INFO - Going to convert document batch...
2025-11-14 16:09:21,936 - INFO - Processing document 4_2024-05-17
2025-11-14 16:09:22,000 - INFO - Finished converting document 4_2024-05-17 in 0.77 sec.
2025-11-14 16:09:22,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,097 - INFO - Going to convert document batch...
2025-11-14 16:09:22,098 - INFO - Processing document 4_2024-05-20
2025-11-14 16:09:22,152 - INFO - Finished converting document 4_2024-05-20 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-17' --> 'data\processed_data\CRM\4_2024-05-17.md'


2025-11-14 16:09:22,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,324 - INFO - Going to convert document batch...
2025-11-14 16:09:22,325 - INFO - Processing document 4_2024-05-21
2025-11-14 16:09:22,380 - INFO - Finished converting document 4_2024-05-21 in 0.09 sec.
2025-11-14 16:09:22,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-20' --> 'data\processed_data\CRM\4_2024-05-20.md'
Converted 'data\edgar_documents\CRM\4_2024-05-21' --> 'data\processed_data\CRM\4_2024-05-21.md'


2025-11-14 16:09:22,476 - INFO - Going to convert document batch...
2025-11-14 16:09:22,479 - INFO - Processing document 4_2024-05-22
2025-11-14 16:09:22,561 - INFO - Finished converting document 4_2024-05-22 in 0.14 sec.
2025-11-14 16:09:22,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,682 - INFO - Going to convert document batch...
2025-11-14 16:09:22,683 - INFO - Processing document 4_2024-05-23
2025-11-14 16:09:22,749 - INFO - Finished converting document 4_2024-05-23 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-22' --> 'data\processed_data\CRM\4_2024-05-22.md'
Converted 'data\edgar_documents\CRM\4_2024-05-23' --> 'data\processed_data\CRM\4_2024-05-23.md'


2025-11-14 16:09:22,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,868 - INFO - Going to convert document batch...
2025-11-14 16:09:22,870 - INFO - Processing document 4_2024-05-24
2025-11-14 16:09:22,965 - INFO - Finished converting document 4_2024-05-24 in 0.16 sec.
2025-11-14 16:09:23,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,067 - INFO - Going to convert document batch...
2025-11-14 16:09:23,068 - INFO - Processing document 4_2024-05-28
2025-11-14 16:09:23,132 - INFO - Finished converting document 4_2024-05-28 in 0.09 sec.
2025-11-14 16:09:23,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-24' --> 'data\processed_data\CRM\4_2024-05-24.md'
Converted 'data\edgar_documents\CRM\4_2024-05-28' --> 'data\processed_data\CRM\4_2024-05-28.md'


2025-11-14 16:09:23,269 - INFO - Going to convert document batch...
2025-11-14 16:09:23,272 - INFO - Processing document 4_2024-05-29
2025-11-14 16:09:23,353 - INFO - Finished converting document 4_2024-05-29 in 0.16 sec.
2025-11-14 16:09:23,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,473 - INFO - Going to convert document batch...
2025-11-14 16:09:23,479 - INFO - Processing document 4_2024-05-30
2025-11-14 16:09:23,555 - INFO - Finished converting document 4_2024-05-30 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-29' --> 'data\processed_data\CRM\4_2024-05-29.md'
Converted 'data\edgar_documents\CRM\4_2024-05-30' --> 'data\processed_data\CRM\4_2024-05-30.md'


2025-11-14 16:09:23,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,678 - INFO - Going to convert document batch...
2025-11-14 16:09:23,679 - INFO - Processing document 4_2024-05-31
2025-11-14 16:09:23,757 - INFO - Finished converting document 4_2024-05-31 in 0.16 sec.
2025-11-14 16:09:23,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,944 - INFO - Going to convert document batch...
2025-11-14 16:09:23,946 - INFO - Processing document 4_2024-06-03


Converted 'data\edgar_documents\CRM\4_2024-05-31' --> 'data\processed_data\CRM\4_2024-05-31.md'


2025-11-14 16:09:24,059 - INFO - Finished converting document 4_2024-06-03 in 0.22 sec.
2025-11-14 16:09:24,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,283 - INFO - Going to convert document batch...
2025-11-14 16:09:24,284 - INFO - Processing document 4_2024-06-04
2025-11-14 16:09:24,350 - INFO - Finished converting document 4_2024-06-04 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-06-03' --> 'data\processed_data\CRM\4_2024-06-03.md'


2025-11-14 16:09:24,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,557 - INFO - Going to convert document batch...
2025-11-14 16:09:24,559 - INFO - Processing document 4_2024-06-05


Converted 'data\edgar_documents\CRM\4_2024-06-04' --> 'data\processed_data\CRM\4_2024-06-04.md'


2025-11-14 16:09:24,672 - INFO - Finished converting document 4_2024-06-05 in 0.23 sec.
2025-11-14 16:09:24,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,806 - INFO - Going to convert document batch...
2025-11-14 16:09:24,808 - INFO - Processing document 4_2024-06-06
2025-11-14 16:09:24,877 - INFO - Finished converting document 4_2024-06-06 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-06-05' --> 'data\processed_data\CRM\4_2024-06-05.md'


2025-11-14 16:09:24,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,056 - INFO - Going to convert document batch...
2025-11-14 16:09:25,060 - INFO - Processing document 4_2024-06-07


Converted 'data\edgar_documents\CRM\4_2024-06-06' --> 'data\processed_data\CRM\4_2024-06-06.md'


2025-11-14 16:09:25,146 - INFO - Finished converting document 4_2024-06-07 in 0.20 sec.
2025-11-14 16:09:25,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,249 - INFO - Going to convert document batch...
2025-11-14 16:09:25,251 - INFO - Processing document 4_2024-06-10
2025-11-14 16:09:25,307 - INFO - Finished converting document 4_2024-06-10 in 0.09 sec.
2025-11-14 16:09:25,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,403 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-06-07' --> 'data\processed_data\CRM\4_2024-06-07.md'
Converted 'data\edgar_documents\CRM\4_2024-06-10' --> 'data\processed_data\CRM\4_2024-06-10.md'


2025-11-14 16:09:25,404 - INFO - Processing document 4_2024-06-11
2025-11-14 16:09:25,449 - INFO - Finished converting document 4_2024-06-11 in 0.09 sec.
2025-11-14 16:09:25,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,527 - INFO - Going to convert document batch...
2025-11-14 16:09:25,528 - INFO - Processing document 4_2024-06-12
2025-11-14 16:09:25,569 - INFO - Finished converting document 4_2024-06-12 in 0.06 sec.
2025-11-14 16:09:25,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-11' --> 'data\processed_data\CRM\4_2024-06-11.md'
Converted 'data\edgar_documents\CRM\4_2024-06-12' --> 'data\processed_data\CRM\4_2024-06-12.md'


2025-11-14 16:09:25,718 - INFO - Going to convert document batch...
2025-11-14 16:09:25,724 - INFO - Processing document 4_2024-06-20
2025-11-14 16:09:25,809 - INFO - Finished converting document 4_2024-06-20 in 0.17 sec.
2025-11-14 16:09:25,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,946 - INFO - Going to convert document batch...
2025-11-14 16:09:25,948 - INFO - Processing document 4_2024-06-24
2025-11-14 16:09:26,001 - INFO - Finished converting document 4_2024-06-24 in 0.12 sec.
2025-11-14 16:09:26,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-20' --> 'data\processed_data\CRM\4_2024-06-20.md'
Converted 'data\edgar_documents\CRM\4_2024-06-24' --> 'data\processed_data\CRM\4_2024-06-24.md'


2025-11-14 16:09:26,090 - INFO - Going to convert document batch...
2025-11-14 16:09:26,092 - INFO - Processing document 4_2024-06-25
2025-11-14 16:09:26,131 - INFO - Finished converting document 4_2024-06-25 in 0.08 sec.
2025-11-14 16:09:26,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,208 - INFO - Going to convert document batch...
2025-11-14 16:09:26,209 - INFO - Processing document 4_2024-06-26
2025-11-14 16:09:26,247 - INFO - Finished converting document 4_2024-06-26 in 0.08 sec.
2025-11-14 16:09:26,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,328 - INFO - Going to convert document batch...
2025-11-14 16:09:26,330 - INFO - Processing document 4_2024-06-28


Converted 'data\edgar_documents\CRM\4_2024-06-25' --> 'data\processed_data\CRM\4_2024-06-25.md'
Converted 'data\edgar_documents\CRM\4_2024-06-26' --> 'data\processed_data\CRM\4_2024-06-26.md'


2025-11-14 16:09:26,389 - INFO - Finished converting document 4_2024-06-28 in 0.11 sec.
2025-11-14 16:09:26,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,522 - INFO - Going to convert document batch...
2025-11-14 16:09:26,525 - INFO - Processing document 4_2024-07-01
2025-11-14 16:09:26,606 - INFO - Finished converting document 4_2024-07-01 in 0.14 sec.
2025-11-14 16:09:26,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-28' --> 'data\processed_data\CRM\4_2024-06-28.md'
Converted 'data\edgar_documents\CRM\4_2024-07-01' --> 'data\processed_data\CRM\4_2024-07-01.md'


2025-11-14 16:09:26,704 - INFO - Going to convert document batch...
2025-11-14 16:09:26,706 - INFO - Processing document 4_2024-07-03
2025-11-14 16:09:26,769 - INFO - Finished converting document 4_2024-07-03 in 0.12 sec.
2025-11-14 16:09:26,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,869 - INFO - Going to convert document batch...
2025-11-14 16:09:26,871 - INFO - Processing document 4_2024-07-10
2025-11-14 16:09:26,932 - INFO - Finished converting document 4_2024-07-10 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-07-03' --> 'data\processed_data\CRM\4_2024-07-03.md'
Converted 'data\edgar_documents\CRM\4_2024-07-10' --> 'data\processed_data\CRM\4_2024-07-10.md'


2025-11-14 16:09:27,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,067 - INFO - Going to convert document batch...
2025-11-14 16:09:27,068 - INFO - Processing document 4_2024-07-17
2025-11-14 16:09:27,132 - INFO - Finished converting document 4_2024-07-17 in 0.12 sec.
2025-11-14 16:09:27,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,221 - INFO - Going to convert document batch...
2025-11-14 16:09:27,222 - INFO - Processing document 4_2024-07-23
2025-11-14 16:09:27,263 - INFO - Finished converting document 4_2024-07-23 in 0.08 sec.
2025-11-14 16:09:27,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,367 - INFO - Going to convert document batch...
2025-11-14 16:09:27,368 - INFO - Processing document 4_2024-07-24


Converted 'data\edgar_documents\CRM\4_2024-07-17' --> 'data\processed_data\CRM\4_2024-07-17.md'
Converted 'data\edgar_documents\CRM\4_2024-07-23' --> 'data\processed_data\CRM\4_2024-07-23.md'


2025-11-14 16:09:27,429 - INFO - Finished converting document 4_2024-07-24 in 0.12 sec.
2025-11-14 16:09:27,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,510 - INFO - Going to convert document batch...
2025-11-14 16:09:27,512 - INFO - Processing document 4_2024-07-25
2025-11-14 16:09:27,549 - INFO - Finished converting document 4_2024-07-25 in 0.08 sec.
2025-11-14 16:09:27,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,639 - INFO - Going to convert document batch...
2025-11-14 16:09:27,641 - INFO - Processing document 4_2024-07-26


Converted 'data\edgar_documents\CRM\4_2024-07-24' --> 'data\processed_data\CRM\4_2024-07-24.md'
Converted 'data\edgar_documents\CRM\4_2024-07-25' --> 'data\processed_data\CRM\4_2024-07-25.md'


2025-11-14 16:09:27,683 - INFO - Finished converting document 4_2024-07-26 in 0.09 sec.
2025-11-14 16:09:27,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,774 - INFO - Going to convert document batch...
2025-11-14 16:09:27,775 - INFO - Processing document 4_2024-07-31
2025-11-14 16:09:27,858 - INFO - Finished converting document 4_2024-07-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-07-26' --> 'data\processed_data\CRM\4_2024-07-26.md'


2025-11-14 16:09:27,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,969 - INFO - Going to convert document batch...
2025-11-14 16:09:28,424 - INFO - Processing document 4_2024-08-07


Converted 'data\edgar_documents\CRM\4_2024-07-31' --> 'data\processed_data\CRM\4_2024-07-31.md'


2025-11-14 16:09:28,583 - INFO - Finished converting document 4_2024-08-07 in 0.66 sec.
2025-11-14 16:09:28,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:28,700 - INFO - Going to convert document batch...
2025-11-14 16:09:28,701 - INFO - Processing document 4_2024-08-12
2025-11-14 16:09:28,755 - INFO - Finished converting document 4_2024-08-12 in 0.09 sec.
2025-11-14 16:09:28,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:28,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-08-07' --> 'data\processed_data\CRM\4_2024-08-07.md'
Converted 'data\edgar_documents\CRM\4_2024-08-12' --> 'data\processed_data\CRM\4_2024-08-12.md'


2025-11-14 16:09:28,864 - INFO - Processing document 4_2024-08-14
2025-11-14 16:09:28,938 - INFO - Finished converting document 4_2024-08-14 in 0.12 sec.
2025-11-14 16:09:29,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,066 - INFO - Going to convert document batch...
2025-11-14 16:09:29,068 - INFO - Processing document 4_2024-08-21


Converted 'data\edgar_documents\CRM\4_2024-08-14' --> 'data\processed_data\CRM\4_2024-08-14.md'


2025-11-14 16:09:29,264 - INFO - Finished converting document 4_2024-08-21 in 0.25 sec.
2025-11-14 16:09:29,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,378 - INFO - Going to convert document batch...
2025-11-14 16:09:29,379 - INFO - Processing document 4_2024-08-23
2025-11-14 16:09:29,416 - INFO - Finished converting document 4_2024-08-23 in 0.09 sec.
2025-11-14 16:09:29,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,511 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-08-21' --> 'data\processed_data\CRM\4_2024-08-21.md'
Converted 'data\edgar_documents\CRM\4_2024-08-23' --> 'data\processed_data\CRM\4_2024-08-23.md'


2025-11-14 16:09:29,512 - INFO - Processing document 4_2024-08-28
2025-11-14 16:09:29,579 - INFO - Finished converting document 4_2024-08-28 in 0.12 sec.
2025-11-14 16:09:29,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,683 - INFO - Going to convert document batch...
2025-11-14 16:09:29,685 - INFO - Processing document 4_2024-09-05
2025-11-14 16:09:29,756 - INFO - Finished converting document 4_2024-09-05 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-08-28' --> 'data\processed_data\CRM\4_2024-08-28.md'


2025-11-14 16:09:29,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,859 - INFO - Going to convert document batch...
2025-11-14 16:09:29,860 - INFO - Processing document 4_2024-09-11
2025-11-14 16:09:29,946 - INFO - Finished converting document 4_2024-09-11 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-09-05' --> 'data\processed_data\CRM\4_2024-09-05.md'


2025-11-14 16:09:30,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,050 - INFO - Going to convert document batch...
2025-11-14 16:09:30,052 - INFO - Processing document 4_2024-09-12
2025-11-14 16:09:30,086 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.
2025-11-14 16:09:30,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,175 - INFO - Going to convert document batch...
2025-11-14 16:09:30,176 - INFO - Processing document 4_2024-09-18


Converted 'data\edgar_documents\CRM\4_2024-09-11' --> 'data\processed_data\CRM\4_2024-09-11.md'
Converted 'data\edgar_documents\CRM\4_2024-09-12' --> 'data\processed_data\CRM\4_2024-09-12.md'


2025-11-14 16:09:30,245 - INFO - Finished converting document 4_2024-09-18 in 0.14 sec.
2025-11-14 16:09:30,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,369 - INFO - Going to convert document batch...
2025-11-14 16:09:30,372 - INFO - Processing document 4_2024-09-23
2025-11-14 16:09:30,435 - INFO - Finished converting document 4_2024-09-23 in 0.12 sec.
2025-11-14 16:09:30,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,506 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-09-18' --> 'data\processed_data\CRM\4_2024-09-18.md'
Converted 'data\edgar_documents\CRM\4_2024-09-23' --> 'data\processed_data\CRM\4_2024-09-23.md'


2025-11-14 16:09:30,507 - INFO - Processing document 4_2024-09-25
2025-11-14 16:09:30,541 - INFO - Finished converting document 4_2024-09-25 in 0.06 sec.
2025-11-14 16:09:30,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,607 - INFO - Going to convert document batch...
2025-11-14 16:09:30,608 - INFO - Processing document 4_2024-09-27
2025-11-14 16:09:30,645 - INFO - Finished converting document 4_2024-09-27 in 0.06 sec.
2025-11-14 16:09:30,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,734 - INFO - Going to convert document batch...
2025-11-14 16:09:30,738 - INFO - Processing document 4_2024-10-02


Converted 'data\edgar_documents\CRM\4_2024-09-25' --> 'data\processed_data\CRM\4_2024-09-25.md'
Converted 'data\edgar_documents\CRM\4_2024-09-27' --> 'data\processed_data\CRM\4_2024-09-27.md'


2025-11-14 16:09:30,820 - INFO - Finished converting document 4_2024-10-02 in 0.12 sec.
2025-11-14 16:09:30,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,906 - INFO - Going to convert document batch...
2025-11-14 16:09:30,907 - INFO - Processing document 4_2024-10-03
2025-11-14 16:09:30,940 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 16:09:30,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,028 - INFO - Going to convert document batch...
2025-11-14 16:09:31,030 - INFO - Processing document 4_2024-10-09


Converted 'data\edgar_documents\CRM\4_2024-10-02' --> 'data\processed_data\CRM\4_2024-10-02.md'
Converted 'data\edgar_documents\CRM\4_2024-10-03' --> 'data\processed_data\CRM\4_2024-10-03.md'


2025-11-14 16:09:31,150 - INFO - Finished converting document 4_2024-10-09 in 0.17 sec.
2025-11-14 16:09:31,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,294 - INFO - Going to convert document batch...
2025-11-14 16:09:31,295 - INFO - Processing document 4_2024-10-16
2025-11-14 16:09:31,360 - INFO - Finished converting document 4_2024-10-16 in 0.12 sec.
2025-11-14 16:09:31,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-10-09' --> 'data\processed_data\CRM\4_2024-10-09.md'
Converted 'data\edgar_documents\CRM\4_2024-10-16' --> 'data\processed_data\CRM\4_2024-10-16.md'


2025-11-14 16:09:31,459 - INFO - Going to convert document batch...
2025-11-14 16:09:31,461 - INFO - Processing document 4_2024-10-22
2025-11-14 16:09:31,520 - INFO - Finished converting document 4_2024-10-22 in 0.09 sec.
2025-11-14 16:09:31,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,596 - INFO - Going to convert document batch...
2025-11-14 16:09:31,596 - INFO - Processing document 4_2024-10-23
2025-11-14 16:09:31,639 - INFO - Finished converting document 4_2024-10-23 in 0.08 sec.
2025-11-14 16:09:31,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,719 - INFO - Going to convert document batch...
2025-11-14 16:09:31,723 - INFO - Processing document 4_2024-10-25
2025-11-14 16:09:31,766 - INFO - Finished converting document 4_2024-10-25 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-10-22' --> 'data\processed_data\CRM\4_2024-10-22.md'
Converted 'data\edgar_documents\CRM\4_2024-10-23' --> 'data\processed_data\CRM\4_2024-10-23.md'


2025-11-14 16:09:31,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,843 - INFO - Going to convert document batch...
2025-11-14 16:09:31,844 - INFO - Processing document 4_2024-10-30
2025-11-14 16:09:31,885 - INFO - Finished converting document 4_2024-10-30 in 0.09 sec.
2025-11-14 16:09:31,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,974 - INFO - Going to convert document batch...
2025-11-14 16:09:31,975 - INFO - Processing document 4_2024-11-04


Converted 'data\edgar_documents\CRM\4_2024-10-25' --> 'data\processed_data\CRM\4_2024-10-25.md'
Converted 'data\edgar_documents\CRM\4_2024-10-30' --> 'data\processed_data\CRM\4_2024-10-30.md'


2025-11-14 16:09:32,014 - INFO - Finished converting document 4_2024-11-04 in 0.08 sec.
2025-11-14 16:09:32,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,096 - INFO - Going to convert document batch...
2025-11-14 16:09:32,097 - INFO - Processing document 4_2024-11-06
2025-11-14 16:09:32,160 - INFO - Finished converting document 4_2024-11-06 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-11-04' --> 'data\processed_data\CRM\4_2024-11-04.md'
Converted 'data\edgar_documents\CRM\4_2024-11-06' --> 'data\processed_data\CRM\4_2024-11-06.md'


2025-11-14 16:09:32,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,275 - INFO - Going to convert document batch...
2025-11-14 16:09:32,277 - INFO - Processing document 4_2024-11-22
2025-11-14 16:09:32,370 - INFO - Finished converting document 4_2024-11-22 in 0.16 sec.
2025-11-14 16:09:32,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,460 - INFO - Going to convert document batch...
2025-11-14 16:09:32,461 - INFO - Processing document 4_2024-11-25
2025-11-14 16:09:32,512 - INFO - Finished converting document 4_2024-11-25 in 0.09 sec.
2025-11-14 16:09:32,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-11-22' --> 'data\processed_data\CRM\4_2024-11-22.md'
Converted 'data\edgar_documents\CRM\4_2024-11-25' --> 'data\processed_data\CRM\4_2024-11-25.md'


2025-11-14 16:09:32,638 - INFO - Going to convert document batch...
2025-11-14 16:09:32,640 - INFO - Processing document 4_2024-11-26
2025-11-14 16:09:32,677 - INFO - Finished converting document 4_2024-11-26 in 0.09 sec.
2025-11-14 16:09:32,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,800 - INFO - Going to convert document batch...
2025-11-14 16:09:32,801 - INFO - Processing document 4_2024-12-20
2025-11-14 16:09:32,927 - INFO - Finished converting document 4_2024-12-20 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2024-11-26' --> 'data\processed_data\CRM\4_2024-11-26.md'


2025-11-14 16:09:33,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,158 - INFO - Going to convert document batch...
2025-11-14 16:09:33,159 - INFO - Processing document 4_2024-12-23
2025-11-14 16:09:33,228 - INFO - Finished converting document 4_2024-12-23 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-20' --> 'data\processed_data\CRM\4_2024-12-20.md'


2025-11-14 16:09:33,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,316 - INFO - Going to convert document batch...
2025-11-14 16:09:33,317 - INFO - Processing document 4_2024-12-26
2025-11-14 16:09:33,366 - INFO - Finished converting document 4_2024-12-26 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-23' --> 'data\processed_data\CRM\4_2024-12-23.md'
Converted 'data\edgar_documents\CRM\4_2024-12-26' --> 'data\processed_data\CRM\4_2024-12-26.md'


2025-11-14 16:09:33,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,506 - INFO - Going to convert document batch...
2025-11-14 16:09:33,507 - INFO - Processing document 4_2024-12-27
2025-11-14 16:09:33,539 - INFO - Finished converting document 4_2024-12-27 in 0.08 sec.
2025-11-14 16:09:33,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,637 - INFO - Going to convert document batch...
2025-11-14 16:09:33,640 - INFO - Processing document 4_2025-01-03
2025-11-14 16:09:33,721 - INFO - Finished converting document 4_2025-01-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-27' --> 'data\processed_data\CRM\4_2024-12-27.md'
Converted 'data\edgar_documents\CRM\4_2025-01-03' --> 'data\processed_data\CRM\4_2025-01-03.md'


2025-11-14 16:09:33,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,840 - INFO - Going to convert document batch...
2025-11-14 16:09:33,841 - INFO - Processing document 4_2025-01-16
2025-11-14 16:09:33,886 - INFO - Finished converting document 4_2025-01-16 in 0.09 sec.
2025-11-14 16:09:33,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,978 - INFO - Going to convert document batch...
2025-11-14 16:09:33,979 - INFO - Processing document 4_2025-01-23
2025-11-14 16:09:34,039 - INFO - Finished converting document 4_2025-01-23 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-01-16' --> 'data\processed_data\CRM\4_2025-01-16.md'
Converted 'data\edgar_documents\CRM\4_2025-01-23' --> 'data\processed_data\CRM\4_2025-01-23.md'


2025-11-14 16:09:34,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,123 - INFO - Going to convert document batch...
2025-11-14 16:09:34,125 - INFO - Processing document 4_2025-02-03
2025-11-14 16:09:34,176 - INFO - Finished converting document 4_2025-02-03 in 0.09 sec.
2025-11-14 16:09:34,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,249 - INFO - Going to convert document batch...
2025-11-14 16:09:34,250 - INFO - Processing document 4_2025-02-04
2025-11-14 16:09:34,310 - INFO - Finished converting document 4_2025-02-04 in 0.09 sec.
2025-11-14 16:09:34,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,409 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-02-03' --> 'data\processed_data\CRM\4_2025-02-03.md'
Converted 'data\edgar_documents\CRM\4_2025-02-04' --> 'data\processed_data\CRM\4_2025-02-04.md'


2025-11-14 16:09:34,410 - INFO - Processing document 4_2025-02-19
2025-11-14 16:09:34,468 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 16:09:34,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,558 - INFO - Going to convert document batch...
2025-11-14 16:09:34,560 - INFO - Processing document 4_2025-02-24
2025-11-14 16:09:34,611 - INFO - Finished converting document 4_2025-02-24 in 0.09 sec.
2025-11-14 16:09:34,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,689 - INFO - Going to convert document batch...
2025-11-14 16:09:34,690 - INFO - Processing document 4_2025-02-25


Converted 'data\edgar_documents\CRM\4_2025-02-19' --> 'data\processed_data\CRM\4_2025-02-19.md'
Converted 'data\edgar_documents\CRM\4_2025-02-24' --> 'data\processed_data\CRM\4_2025-02-24.md'


2025-11-14 16:09:34,739 - INFO - Finished converting document 4_2025-02-25 in 0.08 sec.
2025-11-14 16:09:34,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,838 - INFO - Going to convert document batch...
2025-11-14 16:09:34,840 - INFO - Processing document 4_2025-02-26
2025-11-14 16:09:34,882 - INFO - Finished converting document 4_2025-02-26 in 0.08 sec.
2025-11-14 16:09:34,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,960 - INFO - Going to convert document batch...
2025-11-14 16:09:34,962 - INFO - Processing document 4_2025-03-03
2025-11-14 16:09:34,997 - INFO - Finished converting document 4_2025-03-03 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2025-02-25' --> 'data\processed_data\CRM\4_2025-02-25.md'
Converted 'data\edgar_documents\CRM\4_2025-02-26' --> 'data\processed_data\CRM\4_2025-02-26.md'


2025-11-14 16:09:35,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,071 - INFO - Going to convert document batch...
2025-11-14 16:09:35,073 - INFO - Processing document 4_2025-03-04


Converted 'data\edgar_documents\CRM\4_2025-03-03' --> 'data\processed_data\CRM\4_2025-03-03.md'


2025-11-14 16:09:35,659 - INFO - Finished converting document 4_2025-03-04 in 0.62 sec.
2025-11-14 16:09:35,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,769 - INFO - Going to convert document batch...
2025-11-14 16:09:35,771 - INFO - Processing document 4_2025-03-17
2025-11-14 16:09:35,819 - INFO - Finished converting document 4_2025-03-17 in 0.09 sec.
2025-11-14 16:09:35,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,908 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-03-04' --> 'data\processed_data\CRM\4_2025-03-04.md'
Converted 'data\edgar_documents\CRM\4_2025-03-17' --> 'data\processed_data\CRM\4_2025-03-17.md'


2025-11-14 16:09:35,909 - INFO - Processing document 4_2025-03-18
2025-11-14 16:09:35,951 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.
2025-11-14 16:09:36,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,052 - INFO - Going to convert document batch...
2025-11-14 16:09:36,053 - INFO - Processing document 4_2025-03-25
2025-11-14 16:09:36,142 - INFO - Finished converting document 4_2025-03-25 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-03-18' --> 'data\processed_data\CRM\4_2025-03-18.md'


2025-11-14 16:09:36,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,244 - INFO - Going to convert document batch...
2025-11-14 16:09:36,245 - INFO - Processing document 4_2025-03-27
2025-11-14 16:09:36,304 - INFO - Finished converting document 4_2025-03-27 in 0.08 sec.
2025-11-14 16:09:36,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,386 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-03-25' --> 'data\processed_data\CRM\4_2025-03-25.md'
Converted 'data\edgar_documents\CRM\4_2025-03-27' --> 'data\processed_data\CRM\4_2025-03-27.md'


2025-11-14 16:09:36,387 - INFO - Processing document 4_2025-04-04
2025-11-14 16:09:36,422 - INFO - Finished converting document 4_2025-04-04 in 0.08 sec.
2025-11-14 16:09:36,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,496 - INFO - Going to convert document batch...
2025-11-14 16:09:36,497 - INFO - Processing document 4_2025-04-10
2025-11-14 16:09:36,544 - INFO - Finished converting document 4_2025-04-10 in 0.09 sec.
2025-11-14 16:09:36,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,647 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-04-04' --> 'data\processed_data\CRM\4_2025-04-04.md'
Converted 'data\edgar_documents\CRM\4_2025-04-10' --> 'data\processed_data\CRM\4_2025-04-10.md'


2025-11-14 16:09:36,649 - INFO - Processing document 4_2025-04-17
2025-11-14 16:09:36,711 - INFO - Finished converting document 4_2025-04-17 in 0.09 sec.
2025-11-14 16:09:36,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,820 - INFO - Going to convert document batch...
2025-11-14 16:09:36,821 - INFO - Processing document 4_2025-04-24
2025-11-14 16:09:36,889 - INFO - Finished converting document 4_2025-04-24 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-04-17' --> 'data\processed_data\CRM\4_2025-04-17.md'
Converted 'data\edgar_documents\CRM\4_2025-04-24' --> 'data\processed_data\CRM\4_2025-04-24.md'


2025-11-14 16:09:36,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,992 - INFO - Going to convert document batch...
2025-11-14 16:09:36,994 - INFO - Processing document 4_2025-05-05
2025-11-14 16:09:37,029 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.
2025-11-14 16:09:37,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,137 - INFO - Going to convert document batch...
2025-11-14 16:09:37,139 - INFO - Processing document 4_2025-05-15
2025-11-14 16:09:37,191 - INFO - Finished converting document 4_2025-05-15 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-05-05' --> 'data\processed_data\CRM\4_2025-05-05.md'
Converted 'data\edgar_documents\CRM\4_2025-05-15' --> 'data\processed_data\CRM\4_2025-05-15.md'


2025-11-14 16:09:37,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,313 - INFO - Going to convert document batch...
2025-11-14 16:09:37,316 - INFO - Processing document 4_2025-05-23
2025-11-14 16:09:37,389 - INFO - Finished converting document 4_2025-05-23 in 0.14 sec.
2025-11-14 16:09:37,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,520 - INFO - Going to convert document batch...
2025-11-14 16:09:37,522 - INFO - Processing document 4_2025-05-28
2025-11-14 16:09:37,594 - INFO - Finished converting document 4_2025-05-28 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-05-23' --> 'data\processed_data\CRM\4_2025-05-23.md'
Converted 'data\edgar_documents\CRM\4_2025-05-28' --> 'data\processed_data\CRM\4_2025-05-28.md'


2025-11-14 16:09:37,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,765 - INFO - Going to convert document batch...
2025-11-14 16:09:37,766 - INFO - Processing document 4_2025-06-24
2025-11-14 16:09:37,895 - INFO - Finished converting document 4_2025-06-24 in 0.22 sec.
2025-11-14 16:09:38,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,038 - INFO - Going to convert document batch...
2025-11-14 16:09:38,039 - INFO - Processing document 4_2025-07-01
2025-11-14 16:09:38,094 - INFO - Finished converting document 4_2025-07-01 in 0.11 sec.
2025-11-14 16:09:38,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-06-24' --> 'data\processed_data\CRM\4_2025-06-24.md'
Converted 'data\edgar_documents\CRM\4_2025-07-01' --> 'data\processed_data\CRM\4_2025-07-01.md'


2025-11-14 16:09:38,208 - INFO - Going to convert document batch...
2025-11-14 16:09:38,210 - INFO - Processing document 4_2025-07-03
2025-11-14 16:09:38,313 - INFO - Finished converting document 4_2025-07-03 in 0.16 sec.
2025-11-14 16:09:38,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,435 - INFO - Going to convert document batch...
2025-11-14 16:09:38,437 - INFO - Processing document 4_2025-07-07
2025-11-14 16:09:38,530 - INFO - Finished converting document 4_2025-07-07 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-03' --> 'data\processed_data\CRM\4_2025-07-03.md'


2025-11-14 16:09:38,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,676 - INFO - Going to convert document batch...
2025-11-14 16:09:38,677 - INFO - Processing document 4_2025-07-08
2025-11-14 16:09:38,757 - INFO - Finished converting document 4_2025-07-08 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-07' --> 'data\processed_data\CRM\4_2025-07-07.md'


2025-11-14 16:09:38,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,913 - INFO - Going to convert document batch...
2025-11-14 16:09:38,915 - INFO - Processing document 4_2025-07-09


Converted 'data\edgar_documents\CRM\4_2025-07-08' --> 'data\processed_data\CRM\4_2025-07-08.md'


2025-11-14 16:09:39,046 - INFO - Finished converting document 4_2025-07-09 in 0.22 sec.
2025-11-14 16:09:39,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,236 - INFO - Going to convert document batch...
2025-11-14 16:09:39,237 - INFO - Processing document 4_2025-07-10
2025-11-14 16:09:39,334 - INFO - Finished converting document 4_2025-07-10 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-09' --> 'data\processed_data\CRM\4_2025-07-09.md'


2025-11-14 16:09:39,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,471 - INFO - Going to convert document batch...
2025-11-14 16:09:39,472 - INFO - Processing document 4_2025-07-11
2025-11-14 16:09:39,564 - INFO - Finished converting document 4_2025-07-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-10' --> 'data\processed_data\CRM\4_2025-07-10.md'


2025-11-14 16:09:39,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,670 - INFO - Going to convert document batch...
2025-11-14 16:09:39,671 - INFO - Processing document 4_2025-07-14
2025-11-14 16:09:39,734 - INFO - Finished converting document 4_2025-07-14 in 0.11 sec.
2025-11-14 16:09:39,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-07-11' --> 'data\processed_data\CRM\4_2025-07-11.md'
Converted 'data\edgar_documents\CRM\4_2025-07-14' --> 'data\processed_data\CRM\4_2025-07-14.md'


2025-11-14 16:09:39,860 - INFO - Going to convert document batch...
2025-11-14 16:09:39,861 - INFO - Processing document 4_2025-07-15
2025-11-14 16:09:39,941 - INFO - Finished converting document 4_2025-07-15 in 0.14 sec.
2025-11-14 16:09:40,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,063 - INFO - Going to convert document batch...
2025-11-14 16:09:40,066 - INFO - Processing document 4_2025-07-16
2025-11-14 16:09:40,166 - INFO - Finished converting document 4_2025-07-16 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-15' --> 'data\processed_data\CRM\4_2025-07-15.md'


2025-11-14 16:09:40,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,388 - INFO - Going to convert document batch...
2025-11-14 16:09:40,390 - INFO - Processing document 4_2025-07-17
2025-11-14 16:09:40,485 - INFO - Finished converting document 4_2025-07-17 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-16' --> 'data\processed_data\CRM\4_2025-07-16.md'


2025-11-14 16:09:40,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,586 - INFO - Going to convert document batch...
2025-11-14 16:09:40,587 - INFO - Processing document 4_2025-07-18
2025-11-14 16:09:40,647 - INFO - Finished converting document 4_2025-07-18 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-17' --> 'data\processed_data\CRM\4_2025-07-17.md'
Converted 'data\edgar_documents\CRM\4_2025-07-18' --> 'data\processed_data\CRM\4_2025-07-18.md'


2025-11-14 16:09:40,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,762 - INFO - Going to convert document batch...
2025-11-14 16:09:40,763 - INFO - Processing document 4_2025-07-21
2025-11-14 16:09:40,852 - INFO - Finished converting document 4_2025-07-21 in 0.14 sec.
2025-11-14 16:09:40,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,972 - INFO - Going to convert document batch...
2025-11-14 16:09:40,973 - INFO - Processing document 4_2025-07-22
2025-11-14 16:09:41,053 - INFO - Finished converting document 4_2025-07-22 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-21' --> 'data\processed_data\CRM\4_2025-07-21.md'


2025-11-14 16:09:41,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,155 - INFO - Going to convert document batch...
2025-11-14 16:09:41,156 - INFO - Processing document 4_2025-07-23
2025-11-14 16:09:41,211 - INFO - Finished converting document 4_2025-07-23 in 0.08 sec.
2025-11-14 16:09:41,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,319 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-07-22' --> 'data\processed_data\CRM\4_2025-07-22.md'
Converted 'data\edgar_documents\CRM\4_2025-07-23' --> 'data\processed_data\CRM\4_2025-07-23.md'


2025-11-14 16:09:41,321 - INFO - Processing document 4_2025-07-24
2025-11-14 16:09:41,401 - INFO - Finished converting document 4_2025-07-24 in 0.14 sec.
2025-11-14 16:09:41,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,529 - INFO - Going to convert document batch...
2025-11-14 16:09:41,530 - INFO - Processing document 4_2025-07-25
2025-11-14 16:09:41,584 - INFO - Finished converting document 4_2025-07-25 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-24' --> 'data\processed_data\CRM\4_2025-07-24.md'
Converted 'data\edgar_documents\CRM\4_2025-07-25' --> 'data\processed_data\CRM\4_2025-07-25.md'


2025-11-14 16:09:41,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,716 - INFO - Going to convert document batch...
2025-11-14 16:09:41,720 - INFO - Processing document 4_2025-07-28
2025-11-14 16:09:41,786 - INFO - Finished converting document 4_2025-07-28 in 0.14 sec.
2025-11-14 16:09:41,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,888 - INFO - Going to convert document batch...
2025-11-14 16:09:41,889 - INFO - Processing document 4_2025-07-29
2025-11-14 16:09:41,969 - INFO - Finished converting document 4_2025-07-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-28' --> 'data\processed_data\CRM\4_2025-07-28.md'
Converted 'data\edgar_documents\CRM\4_2025-07-29' --> 'data\processed_data\CRM\4_2025-07-29.md'


2025-11-14 16:09:42,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,105 - INFO - Going to convert document batch...
2025-11-14 16:09:42,106 - INFO - Processing document 4_2025-07-30
2025-11-14 16:09:42,201 - INFO - Finished converting document 4_2025-07-30 in 0.16 sec.
2025-11-14 16:09:42,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,343 - INFO - Going to convert document batch...
2025-11-14 16:09:42,344 - INFO - Processing document 4_2025-07-31
2025-11-14 16:09:42,436 - INFO - Finished converting document 4_2025-07-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-30' --> 'data\processed_data\CRM\4_2025-07-30.md'


2025-11-14 16:09:42,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,566 - INFO - Going to convert document batch...
2025-11-14 16:09:42,567 - INFO - Processing document 4_2025-08-01
2025-11-14 16:09:42,639 - INFO - Finished converting document 4_2025-08-01 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-31' --> 'data\processed_data\CRM\4_2025-07-31.md'


2025-11-14 16:09:42,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,786 - INFO - Going to convert document batch...
2025-11-14 16:09:42,787 - INFO - Processing document 4_2025-08-04


Converted 'data\edgar_documents\CRM\4_2025-08-01' --> 'data\processed_data\CRM\4_2025-08-01.md'


2025-11-14 16:09:43,434 - INFO - Finished converting document 4_2025-08-04 in 0.70 sec.
2025-11-14 16:09:43,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:43,544 - INFO - Going to convert document batch...
2025-11-14 16:09:43,545 - INFO - Processing document 4_2025-08-05
2025-11-14 16:09:43,604 - INFO - Finished converting document 4_2025-08-05 in 0.11 sec.
2025-11-14 16:09:43,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-08-04' --> 'data\processed_data\CRM\4_2025-08-04.md'
Converted 'data\edgar_documents\CRM\4_2025-08-05' --> 'data\processed_data\CRM\4_2025-08-05.md'


2025-11-14 16:09:43,711 - INFO - Going to convert document batch...
2025-11-14 16:09:43,714 - INFO - Processing document 4_2025-08-06
2025-11-14 16:09:43,803 - INFO - Finished converting document 4_2025-08-06 in 0.14 sec.
2025-11-14 16:09:43,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:43,967 - INFO - Going to convert document batch...
2025-11-14 16:09:43,968 - INFO - Processing document 4_2025-08-07
2025-11-14 16:09:44,044 - INFO - Finished converting document 4_2025-08-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-06' --> 'data\processed_data\CRM\4_2025-08-06.md'


2025-11-14 16:09:44,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,299 - INFO - Going to convert document batch...
2025-11-14 16:09:44,303 - INFO - Processing document 4_2025-08-08


Converted 'data\edgar_documents\CRM\4_2025-08-07' --> 'data\processed_data\CRM\4_2025-08-07.md'


2025-11-14 16:09:44,488 - INFO - Finished converting document 4_2025-08-08 in 0.36 sec.
2025-11-14 16:09:44,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,634 - INFO - Going to convert document batch...
2025-11-14 16:09:44,636 - INFO - Processing document 4_2025-08-11
2025-11-14 16:09:44,737 - INFO - Finished converting document 4_2025-08-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-08' --> 'data\processed_data\CRM\4_2025-08-08.md'


2025-11-14 16:09:44,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,939 - INFO - Going to convert document batch...
2025-11-14 16:09:44,941 - INFO - Processing document 4_2025-08-12


Converted 'data\edgar_documents\CRM\4_2025-08-11' --> 'data\processed_data\CRM\4_2025-08-11.md'


2025-11-14 16:09:45,090 - INFO - Finished converting document 4_2025-08-12 in 0.25 sec.
2025-11-14 16:09:45,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,274 - INFO - Going to convert document batch...
2025-11-14 16:09:45,276 - INFO - Processing document 4_2025-08-13
2025-11-14 16:09:45,361 - INFO - Finished converting document 4_2025-08-13 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-12' --> 'data\processed_data\CRM\4_2025-08-12.md'


2025-11-14 16:09:45,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,596 - INFO - Going to convert document batch...
2025-11-14 16:09:45,601 - INFO - Processing document 4_2025-08-14


Converted 'data\edgar_documents\CRM\4_2025-08-13' --> 'data\processed_data\CRM\4_2025-08-13.md'


2025-11-14 16:09:45,736 - INFO - Finished converting document 4_2025-08-14 in 0.26 sec.
2025-11-14 16:09:45,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,847 - INFO - Going to convert document batch...
2025-11-14 16:09:45,849 - INFO - Processing document 4_2025-08-15
2025-11-14 16:09:45,916 - INFO - Finished converting document 4_2025-08-15 in 0.12 sec.
2025-11-14 16:09:46,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-08-14' --> 'data\processed_data\CRM\4_2025-08-14.md'
Converted 'data\edgar_documents\CRM\4_2025-08-15' --> 'data\processed_data\CRM\4_2025-08-15.md'


2025-11-14 16:09:46,050 - INFO - Going to convert document batch...
2025-11-14 16:09:46,052 - INFO - Processing document 4_2025-08-18
2025-11-14 16:09:46,288 - INFO - Finished converting document 4_2025-08-18 in 0.31 sec.
2025-11-14 16:09:46,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,467 - INFO - Going to convert document batch...
2025-11-14 16:09:46,469 - INFO - Processing document 4_2025-08-19
2025-11-14 16:09:46,586 - INFO - Finished converting document 4_2025-08-19 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-18' --> 'data\processed_data\CRM\4_2025-08-18.md'


2025-11-14 16:09:46,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,754 - INFO - Going to convert document batch...
2025-11-14 16:09:46,756 - INFO - Processing document 4_2025-08-20
2025-11-14 16:09:46,835 - INFO - Finished converting document 4_2025-08-20 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-19' --> 'data\processed_data\CRM\4_2025-08-19.md'


2025-11-14 16:09:46,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,975 - INFO - Going to convert document batch...
2025-11-14 16:09:46,977 - INFO - Processing document 4_2025-08-21
2025-11-14 16:09:47,052 - INFO - Finished converting document 4_2025-08-21 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-20' --> 'data\processed_data\CRM\4_2025-08-20.md'
Converted 'data\edgar_documents\CRM\4_2025-08-21' --> 'data\processed_data\CRM\4_2025-08-21.md'


2025-11-14 16:09:47,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,198 - INFO - Going to convert document batch...
2025-11-14 16:09:47,200 - INFO - Processing document 4_2025-08-22
2025-11-14 16:09:47,305 - INFO - Finished converting document 4_2025-08-22 in 0.19 sec.
2025-11-14 16:09:47,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,421 - INFO - Going to convert document batch...
2025-11-14 16:09:47,422 - INFO - Processing document 4_2025-08-25
2025-11-14 16:09:47,462 - INFO - Finished converting document 4_2025-08-25 in 0.08 sec.
2025-11-14 16:09:47,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,555 - INFO - Going to convert document batch...
2025-11-14 16:09:47,556 - INFO - Processing document 4_2025-08-26


Converted 'data\edgar_documents\CRM\4_2025-08-22' --> 'data\processed_data\CRM\4_2025-08-22.md'
Converted 'data\edgar_documents\CRM\4_2025-08-25' --> 'data\processed_data\CRM\4_2025-08-25.md'


2025-11-14 16:09:47,666 - INFO - Finished converting document 4_2025-08-26 in 0.17 sec.
2025-11-14 16:09:47,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,820 - INFO - Going to convert document batch...
2025-11-14 16:09:47,822 - INFO - Processing document 4_2025-08-27
2025-11-14 16:09:47,923 - INFO - Finished converting document 4_2025-08-27 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-26' --> 'data\processed_data\CRM\4_2025-08-26.md'


2025-11-14 16:09:48,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,057 - INFO - Going to convert document batch...
2025-11-14 16:09:48,059 - INFO - Processing document 4_2025-08-28
2025-11-14 16:09:48,154 - INFO - Finished converting document 4_2025-08-28 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-27' --> 'data\processed_data\CRM\4_2025-08-27.md'


2025-11-14 16:09:48,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,322 - INFO - Going to convert document batch...
2025-11-14 16:09:48,324 - INFO - Processing document 4_2025-08-29
2025-11-14 16:09:48,393 - INFO - Finished converting document 4_2025-08-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-28' --> 'data\processed_data\CRM\4_2025-08-28.md'


2025-11-14 16:09:48,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,550 - INFO - Going to convert document batch...
2025-11-14 16:09:48,553 - INFO - Processing document 4_2025-09-02


Converted 'data\edgar_documents\CRM\4_2025-08-29' --> 'data\processed_data\CRM\4_2025-08-29.md'


2025-11-14 16:09:48,718 - INFO - Finished converting document 4_2025-09-02 in 0.25 sec.
2025-11-14 16:09:48,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,865 - INFO - Going to convert document batch...
2025-11-14 16:09:48,867 - INFO - Processing document 4_2025-09-03


Converted 'data\edgar_documents\CRM\4_2025-09-02' --> 'data\processed_data\CRM\4_2025-09-02.md'


2025-11-14 16:09:48,993 - INFO - Finished converting document 4_2025-09-03 in 0.20 sec.
2025-11-14 16:09:49,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,166 - INFO - Going to convert document batch...
2025-11-14 16:09:49,167 - INFO - Processing document 4_2025-09-04
2025-11-14 16:09:49,290 - INFO - Finished converting document 4_2025-09-04 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-03' --> 'data\processed_data\CRM\4_2025-09-03.md'


2025-11-14 16:09:49,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,460 - INFO - Going to convert document batch...
2025-11-14 16:09:49,462 - INFO - Processing document 4_2025-09-05
2025-11-14 16:09:49,587 - INFO - Finished converting document 4_2025-09-05 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-04' --> 'data\processed_data\CRM\4_2025-09-04.md'


2025-11-14 16:09:49,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,711 - INFO - Going to convert document batch...
2025-11-14 16:09:49,713 - INFO - Processing document 4_2025-09-08
2025-11-14 16:09:49,825 - INFO - Finished converting document 4_2025-09-08 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-05' --> 'data\processed_data\CRM\4_2025-09-05.md'


2025-11-14 16:09:49,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,986 - INFO - Going to convert document batch...
2025-11-14 16:09:49,987 - INFO - Processing document 4_2025-09-09
2025-11-14 16:09:50,100 - INFO - Finished converting document 4_2025-09-09 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-08' --> 'data\processed_data\CRM\4_2025-09-08.md'


2025-11-14 16:09:50,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,244 - INFO - Going to convert document batch...
2025-11-14 16:09:50,245 - INFO - Processing document 4_2025-09-10
2025-11-14 16:09:50,306 - INFO - Finished converting document 4_2025-09-10 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-09' --> 'data\processed_data\CRM\4_2025-09-09.md'
Converted 'data\edgar_documents\CRM\4_2025-09-10' --> 'data\processed_data\CRM\4_2025-09-10.md'


2025-11-14 16:09:50,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,473 - INFO - Going to convert document batch...
2025-11-14 16:09:50,475 - INFO - Processing document 4_2025-09-11
2025-11-14 16:09:50,599 - INFO - Finished converting document 4_2025-09-11 in 0.24 sec.
2025-11-14 16:09:50,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,702 - INFO - Going to convert document batch...
2025-11-14 16:09:50,703 - INFO - Processing document 4_2025-09-12
2025-11-14 16:09:50,769 - INFO - Finished converting document 4_2025-09-12 in 0.11 sec.
2025-11-14 16:09:50,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-11' --> 'data\processed_data\CRM\4_2025-09-11.md'
Converted 'data\edgar_documents\CRM\4_2025-09-12' --> 'data\processed_data\CRM\4_2025-09-12.md'


2025-11-14 16:09:50,899 - INFO - Going to convert document batch...
2025-11-14 16:09:50,901 - INFO - Processing document 4_2025-09-15
2025-11-14 16:09:51,011 - INFO - Finished converting document 4_2025-09-15 in 0.19 sec.
2025-11-14 16:09:51,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-15' --> 'data\processed_data\CRM\4_2025-09-15.md'


2025-11-14 16:09:51,630 - INFO - Going to convert document batch...
2025-11-14 16:09:51,632 - INFO - Processing document 4_2025-09-16
2025-11-14 16:09:51,702 - INFO - Finished converting document 4_2025-09-16 in 0.59 sec.
2025-11-14 16:09:51,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:51,818 - INFO - Going to convert document batch...
2025-11-14 16:09:51,819 - INFO - Processing document 4_2025-09-17
2025-11-14 16:09:51,902 - INFO - Finished converting document 4_2025-09-17 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-16' --> 'data\processed_data\CRM\4_2025-09-16.md'


2025-11-14 16:09:51,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,006 - INFO - Going to convert document batch...
2025-11-14 16:09:52,008 - INFO - Processing document 4_2025-09-18
2025-11-14 16:09:52,071 - INFO - Finished converting document 4_2025-09-18 in 0.09 sec.
2025-11-14 16:09:52,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-17' --> 'data\processed_data\CRM\4_2025-09-17.md'
Converted 'data\edgar_documents\CRM\4_2025-09-18' --> 'data\processed_data\CRM\4_2025-09-18.md'


2025-11-14 16:09:52,187 - INFO - Going to convert document batch...
2025-11-14 16:09:52,188 - INFO - Processing document 4_2025-09-19
2025-11-14 16:09:52,282 - INFO - Finished converting document 4_2025-09-19 in 0.14 sec.
2025-11-14 16:09:52,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,438 - INFO - Going to convert document batch...
2025-11-14 16:09:52,439 - INFO - Processing document 4_2025-09-22
2025-11-14 16:09:52,539 - INFO - Finished converting document 4_2025-09-22 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-19' --> 'data\processed_data\CRM\4_2025-09-19.md'


2025-11-14 16:09:52,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,669 - INFO - Going to convert document batch...
2025-11-14 16:09:52,671 - INFO - Processing document 4_2025-09-23
2025-11-14 16:09:52,748 - INFO - Finished converting document 4_2025-09-23 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-22' --> 'data\processed_data\CRM\4_2025-09-22.md'
Converted 'data\edgar_documents\CRM\4_2025-09-23' --> 'data\processed_data\CRM\4_2025-09-23.md'


2025-11-14 16:09:52,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,860 - INFO - Going to convert document batch...
2025-11-14 16:09:52,861 - INFO - Processing document 4_2025-09-24
2025-11-14 16:09:52,931 - INFO - Finished converting document 4_2025-09-24 in 0.12 sec.
2025-11-14 16:09:53,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,132 - INFO - Going to convert document batch...
2025-11-14 16:09:53,133 - INFO - Processing document 4_2025-09-25


Converted 'data\edgar_documents\CRM\4_2025-09-24' --> 'data\processed_data\CRM\4_2025-09-24.md'


2025-11-14 16:09:53,226 - INFO - Finished converting document 4_2025-09-25 in 0.20 sec.
2025-11-14 16:09:53,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,339 - INFO - Going to convert document batch...
2025-11-14 16:09:53,340 - INFO - Processing document 4_2025-09-26
2025-11-14 16:09:53,418 - INFO - Finished converting document 4_2025-09-26 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-25' --> 'data\processed_data\CRM\4_2025-09-25.md'
Converted 'data\edgar_documents\CRM\4_2025-09-26' --> 'data\processed_data\CRM\4_2025-09-26.md'


2025-11-14 16:09:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,534 - INFO - Going to convert document batch...
2025-11-14 16:09:53,535 - INFO - Processing document 4_2025-09-29
2025-11-14 16:09:53,612 - INFO - Finished converting document 4_2025-09-29 in 0.14 sec.
2025-11-14 16:09:53,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,770 - INFO - Going to convert document batch...
2025-11-14 16:09:53,771 - INFO - Processing document 4_2025-09-30
2025-11-14 16:09:53,863 - INFO - Finished converting document 4_2025-09-30 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-29' --> 'data\processed_data\CRM\4_2025-09-29.md'
Converted 'data\edgar_documents\CRM\4_2025-09-30' --> 'data\processed_data\CRM\4_2025-09-30.md'


2025-11-14 16:09:53,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,982 - INFO - Going to convert document batch...
2025-11-14 16:09:53,984 - INFO - Processing document 4_2025-10-01
2025-11-14 16:09:54,094 - INFO - Finished converting document 4_2025-10-01 in 0.19 sec.
2025-11-14 16:09:54,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,211 - INFO - Going to convert document batch...
2025-11-14 16:09:54,212 - INFO - Processing document 4_2025-10-02
2025-11-14 16:09:54,323 - INFO - Finished converting document 4_2025-10-02 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-01' --> 'data\processed_data\CRM\4_2025-10-01.md'


2025-11-14 16:09:54,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,457 - INFO - Going to convert document batch...
2025-11-14 16:09:54,459 - INFO - Processing document 4_2025-10-03
2025-11-14 16:09:54,533 - INFO - Finished converting document 4_2025-10-03 in 0.11 sec.
2025-11-14 16:09:54,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-10-02' --> 'data\processed_data\CRM\4_2025-10-02.md'
Converted 'data\edgar_documents\CRM\4_2025-10-03' --> 'data\processed_data\CRM\4_2025-10-03.md'


2025-11-14 16:09:54,644 - INFO - Going to convert document batch...
2025-11-14 16:09:54,645 - INFO - Processing document 4_2025-10-06
2025-11-14 16:09:54,706 - INFO - Finished converting document 4_2025-10-06 in 0.11 sec.
2025-11-14 16:09:54,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,933 - INFO - Going to convert document batch...
2025-11-14 16:09:54,934 - INFO - Processing document 4_2025-10-07
2025-11-14 16:09:55,026 - INFO - Finished converting document 4_2025-10-07 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-06' --> 'data\processed_data\CRM\4_2025-10-06.md'


2025-11-14 16:09:55,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,215 - INFO - Going to convert document batch...
2025-11-14 16:09:55,217 - INFO - Processing document 4_2025-10-08


Converted 'data\edgar_documents\CRM\4_2025-10-07' --> 'data\processed_data\CRM\4_2025-10-07.md'


2025-11-14 16:09:55,366 - INFO - Finished converting document 4_2025-10-08 in 0.22 sec.
2025-11-14 16:09:55,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,644 - INFO - Going to convert document batch...
2025-11-14 16:09:55,645 - INFO - Processing document 4_2025-10-09


Converted 'data\edgar_documents\CRM\4_2025-10-08' --> 'data\processed_data\CRM\4_2025-10-08.md'


2025-11-14 16:09:55,721 - INFO - Finished converting document 4_2025-10-09 in 0.20 sec.
2025-11-14 16:09:55,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,843 - INFO - Going to convert document batch...
2025-11-14 16:09:55,844 - INFO - Processing document 4_2025-10-10
2025-11-14 16:09:55,911 - INFO - Finished converting document 4_2025-10-10 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-09' --> 'data\processed_data\CRM\4_2025-10-09.md'
Converted 'data\edgar_documents\CRM\4_2025-10-10' --> 'data\processed_data\CRM\4_2025-10-10.md'


2025-11-14 16:09:56,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,053 - INFO - Going to convert document batch...
2025-11-14 16:09:56,054 - INFO - Processing document 4_2025-10-14
2025-11-14 16:09:56,196 - INFO - Finished converting document 4_2025-10-14 in 0.20 sec.
2025-11-14 16:09:56,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,335 - INFO - Going to convert document batch...
2025-11-14 16:09:56,336 - INFO - Processing document 4_2025-10-15
2025-11-14 16:09:56,436 - INFO - Finished converting document 4_2025-10-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-14' --> 'data\processed_data\CRM\4_2025-10-14.md'


2025-11-14 16:09:56,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,622 - INFO - Going to convert document batch...
2025-11-14 16:09:56,623 - INFO - Processing document 4_2025-10-16
2025-11-14 16:09:56,700 - INFO - Finished converting document 4_2025-10-16 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-15' --> 'data\processed_data\CRM\4_2025-10-15.md'


2025-11-14 16:09:56,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,807 - INFO - Going to convert document batch...
2025-11-14 16:09:56,809 - INFO - Processing document 4_2025-10-17
2025-11-14 16:09:56,891 - INFO - Finished converting document 4_2025-10-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-16' --> 'data\processed_data\CRM\4_2025-10-16.md'


2025-11-14 16:09:57,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,045 - INFO - Going to convert document batch...
2025-11-14 16:09:57,046 - INFO - Processing document 4_2025-10-20
2025-11-14 16:09:57,136 - INFO - Finished converting document 4_2025-10-20 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-17' --> 'data\processed_data\CRM\4_2025-10-17.md'


2025-11-14 16:09:57,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,261 - INFO - Going to convert document batch...
2025-11-14 16:09:57,262 - INFO - Processing document 4_2025-10-21
2025-11-14 16:09:57,354 - INFO - Finished converting document 4_2025-10-21 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-20' --> 'data\processed_data\CRM\4_2025-10-20.md'
Converted 'data\edgar_documents\CRM\4_2025-10-21' --> 'data\processed_data\CRM\4_2025-10-21.md'


2025-11-14 16:09:57,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,497 - INFO - Going to convert document batch...
2025-11-14 16:09:57,498 - INFO - Processing document 4_2025-10-22
2025-11-14 16:09:57,673 - INFO - Finished converting document 4_2025-10-22 in 0.25 sec.
2025-11-14 16:09:57,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,811 - INFO - Going to convert document batch...
2025-11-14 16:09:57,813 - INFO - Processing document 4_2025-10-23
2025-11-14 16:09:57,878 - INFO - Finished converting document 4_2025-10-23 in 0.12 sec.
2025-11-14 16:09:57,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-10-22' --> 'data\processed_data\CRM\4_2025-10-22.md'
Converted 'data\edgar_documents\CRM\4_2025-10-23' --> 'data\processed_data\CRM\4_2025-10-23.md'


2025-11-14 16:09:58,482 - INFO - Going to convert document batch...
2025-11-14 16:09:58,484 - INFO - Processing document 4_2025-10-24
2025-11-14 16:09:58,577 - INFO - Finished converting document 4_2025-10-24 in 0.66 sec.
2025-11-14 16:09:58,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:58,690 - INFO - Going to convert document batch...
2025-11-14 16:09:58,692 - INFO - Processing document 4_2025-10-27
2025-11-14 16:09:58,788 - INFO - Finished converting document 4_2025-10-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-24' --> 'data\processed_data\CRM\4_2025-10-24.md'


2025-11-14 16:09:58,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:58,932 - INFO - Going to convert document batch...
2025-11-14 16:09:58,934 - INFO - Processing document 4_2025-10-28


Converted 'data\edgar_documents\CRM\4_2025-10-27' --> 'data\processed_data\CRM\4_2025-10-27.md'


2025-11-14 16:09:59,084 - INFO - Finished converting document 4_2025-10-28 in 0.22 sec.
2025-11-14 16:09:59,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,196 - INFO - Going to convert document batch...
2025-11-14 16:09:59,198 - INFO - Processing document 4_2025-10-29
2025-11-14 16:09:59,263 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-28' --> 'data\processed_data\CRM\4_2025-10-28.md'
Converted 'data\edgar_documents\CRM\4_2025-10-29' --> 'data\processed_data\CRM\4_2025-10-29.md'


2025-11-14 16:09:59,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,392 - INFO - Going to convert document batch...
2025-11-14 16:09:59,394 - INFO - Processing document 4_2025-10-30
2025-11-14 16:09:59,484 - INFO - Finished converting document 4_2025-10-30 in 0.16 sec.
2025-11-14 16:09:59,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,592 - INFO - Going to convert document batch...
2025-11-14 16:09:59,594 - INFO - Processing document 4_2025-10-31
2025-11-14 16:09:59,680 - INFO - Finished converting document 4_2025-10-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-30' --> 'data\processed_data\CRM\4_2025-10-30.md'


2025-11-14 16:09:59,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,852 - INFO - Going to convert document batch...
2025-11-14 16:09:59,853 - INFO - Processing document 4_2025-11-03
2025-11-14 16:09:59,956 - INFO - Finished converting document 4_2025-11-03 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-31' --> 'data\processed_data\CRM\4_2025-10-31.md'


2025-11-14 16:10:00,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,072 - INFO - Going to convert document batch...
2025-11-14 16:10:00,074 - INFO - Processing document 4_2025-11-04
2025-11-14 16:10:00,138 - INFO - Finished converting document 4_2025-11-04 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-11-03' --> 'data\processed_data\CRM\4_2025-11-03.md'
Converted 'data\edgar_documents\CRM\4_2025-11-04' --> 'data\processed_data\CRM\4_2025-11-04.md'


2025-11-14 16:10:00,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,282 - INFO - Going to convert document batch...
2025-11-14 16:10:00,283 - INFO - Processing document 8-K_2023-01-04
2025-11-14 16:10:00,331 - INFO - Finished converting document 8-K_2023-01-04 in 0.12 sec.
2025-11-14 16:10:00,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,389 - INFO - Going to convert document batch...
2025-11-14 16:10:00,391 - INFO - Processing document 8-K_2023-01-27
2025-11-14 16:10:00,434 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 16:10:00,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,516 - INFO - Going to convert document batch...
2025-11-14 16:10:00,517 - INFO - Processing document 8-K_2023-03-01
2025-11-14 16:10:00,550 - INFO - Finished converting document 8-K_2023-03-01 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2023-01-04' --> 'data\processed_data\CRM\8-K_2023-01-04.md'
Converted 'data\edgar_documents\CRM\8-K_2023-01-27' --> 'data\processed_data\CRM\8-K_2023-01-27.md'


2025-11-14 16:10:00,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,609 - INFO - Going to convert document batch...
2025-11-14 16:10:00,610 - INFO - Processing document 8-K_2023-05-31
2025-11-14 16:10:00,650 - INFO - Finished converting document 8-K_2023-05-31 in 0.08 sec.
2025-11-14 16:10:00,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2023-03-01' --> 'data\processed_data\CRM\8-K_2023-03-01.md'
Converted 'data\edgar_documents\CRM\8-K_2023-05-31' --> 'data\processed_data\CRM\8-K_2023-05-31.md'


2025-11-14 16:10:00,793 - INFO - Going to convert document batch...
2025-11-14 16:10:00,794 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:10:00,884 - INFO - Finished converting document 8-K_2023-06-12 in 0.20 sec.
2025-11-14 16:10:00,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,010 - INFO - Going to convert document batch...
2025-11-14 16:10:01,012 - INFO - Processing document 8-K_2023-08-30
2025-11-14 16:10:01,051 - INFO - Finished converting document 8-K_2023-08-30 in 0.12 sec.
2025-11-14 16:10:01,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2023-06-12' --> 'data\processed_data\CRM\8-K_2023-06-12.md'
Converted 'data\edgar_documents\CRM\8-K_2023-08-30' --> 'data\processed_data\CRM\8-K_2023-08-30.md'


2025-11-14 16:10:01,121 - INFO - Going to convert document batch...
2025-11-14 16:10:01,123 - INFO - Processing document 8-K_2023-11-29
2025-11-14 16:10:01,164 - INFO - Finished converting document 8-K_2023-11-29 in 0.09 sec.
2025-11-14 16:10:01,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,214 - INFO - Going to convert document batch...
2025-11-14 16:10:01,215 - INFO - Processing document 8-K_2024-02-28
2025-11-14 16:10:01,249 - INFO - Finished converting document 8-K_2024-02-28 in 0.06 sec.
2025-11-14 16:10:01,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,332 - INFO - Going to convert document batch...
2025-11-14 16:10:01,334 - INFO - Processing document 8-K_2024-05-29
2025-11-14 16:10:01,379 - INFO - Finished converting document 8-K_2024-05-29 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2023-11-29' --> 'data\processed_data\CRM\8-K_2023-11-29.md'
Converted 'data\edgar_documents\CRM\8-K_2024-02-28' --> 'data\processed_data\CRM\8-K_2024-02-28.md'


2025-11-14 16:10:01,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,488 - INFO - Going to convert document batch...
2025-11-14 16:10:01,490 - INFO - Processing document 8-K_2024-07-01


Converted 'data\edgar_documents\CRM\8-K_2024-05-29' --> 'data\processed_data\CRM\8-K_2024-05-29.md'


2025-11-14 16:10:01,612 - INFO - Finished converting document 8-K_2024-07-01 in 0.20 sec.
2025-11-14 16:10:01,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,705 - INFO - Going to convert document batch...
2025-11-14 16:10:01,707 - INFO - Processing document 8-K_2024-08-28
2025-11-14 16:10:01,784 - INFO - Finished converting document 8-K_2024-08-28 in 0.11 sec.
2025-11-14 16:10:01,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2024-07-01' --> 'data\processed_data\CRM\8-K_2024-07-01.md'
Converted 'data\edgar_documents\CRM\8-K_2024-08-28' --> 'data\processed_data\CRM\8-K_2024-08-28.md'


2025-11-14 16:10:01,861 - INFO - Going to convert document batch...
2025-11-14 16:10:01,862 - INFO - Processing document 8-K_2024-09-05
2025-11-14 16:10:01,903 - INFO - Finished converting document 8-K_2024-09-05 in 0.09 sec.
2025-11-14 16:10:01,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,965 - INFO - Going to convert document batch...
2025-11-14 16:10:01,966 - INFO - Processing document 8-K_2024-11-05
2025-11-14 16:10:02,001 - INFO - Finished converting document 8-K_2024-11-05 in 0.08 sec.
2025-11-14 16:10:02,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,094 - INFO - Going to convert document batch...
2025-11-14 16:10:02,095 - INFO - Processing document 8-K_2024-12-03


Converted 'data\edgar_documents\CRM\8-K_2024-09-05' --> 'data\processed_data\CRM\8-K_2024-09-05.md'
Converted 'data\edgar_documents\CRM\8-K_2024-11-05' --> 'data\processed_data\CRM\8-K_2024-11-05.md'


2025-11-14 16:10:02,135 - INFO - Finished converting document 8-K_2024-12-03 in 0.11 sec.
2025-11-14 16:10:02,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,192 - INFO - Going to convert document batch...
2025-11-14 16:10:02,193 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:10:02,232 - INFO - Finished converting document 8-K_2024-12-10 in 0.08 sec.
2025-11-14 16:10:02,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,306 - INFO - Going to convert document batch...
2025-11-14 16:10:02,310 - INFO - Processing document 8-K_2025-02-05
2025-11-14 16:10:02,347 - INFO - Finished converting document 8-K_2025-02-05 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2024-12-03' --> 'data\processed_data\CRM\8-K_2024-12-03.md'
Converted 'data\edgar_documents\CRM\8-K_2024-12-10' --> 'data\processed_data\CRM\8-K_2024-12-10.md'


2025-11-14 16:10:02,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,413 - INFO - Going to convert document batch...
2025-11-14 16:10:02,414 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:10:02,463 - INFO - Finished converting document 8-K_2025-02-26 in 0.09 sec.
2025-11-14 16:10:02,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,541 - INFO - Going to convert document batch...
2025-11-14 16:10:02,542 - INFO - Processing document 8-K_2025-05-27
2025-11-14 16:10:02,570 - INFO - Finished converting document 8-K_2025-05-27 in 0.06 sec.


Converted 'data\edgar_documents\CRM\8-K_2025-02-05' --> 'data\processed_data\CRM\8-K_2025-02-05.md'
Converted 'data\edgar_documents\CRM\8-K_2025-02-26' --> 'data\processed_data\CRM\8-K_2025-02-26.md'


2025-11-14 16:10:02,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,625 - INFO - Going to convert document batch...
2025-11-14 16:10:02,626 - INFO - Processing document 8-K_2025-05-28
2025-11-14 16:10:02,659 - INFO - Finished converting document 8-K_2025-05-28 in 0.08 sec.
2025-11-14 16:10:02,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,738 - INFO - Going to convert document batch...
2025-11-14 16:10:02,740 - INFO - Processing document 8-K_2025-06-09


Converted 'data\edgar_documents\CRM\8-K_2025-05-27' --> 'data\processed_data\CRM\8-K_2025-05-27.md'
Converted 'data\edgar_documents\CRM\8-K_2025-05-28' --> 'data\processed_data\CRM\8-K_2025-05-28.md'


2025-11-14 16:10:02,828 - INFO - Finished converting document 8-K_2025-06-09 in 0.14 sec.
2025-11-14 16:10:02,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,911 - INFO - Going to convert document batch...
2025-11-14 16:10:02,912 - INFO - Processing document 8-K_2025-06-24
2025-11-14 16:10:02,950 - INFO - Finished converting document 8-K_2025-06-24 in 0.09 sec.
2025-11-14 16:10:02,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:03,022 - INFO - Going to convert document batch...
2025-11-14 16:10:03,023 - INFO - Processing document 8-K_2025-07-09


Converted 'data\edgar_documents\CRM\8-K_2025-06-09' --> 'data\processed_data\CRM\8-K_2025-06-09.md'
Converted 'data\edgar_documents\CRM\8-K_2025-06-24' --> 'data\processed_data\CRM\8-K_2025-06-24.md'


2025-11-14 16:10:03,059 - INFO - Finished converting document 8-K_2025-07-09 in 0.09 sec.
2025-11-14 16:10:03,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:03,148 - INFO - Going to convert document batch...
2025-11-14 16:10:03,151 - INFO - Processing document 8-K_2025-09-03
2025-11-14 16:10:03,232 - INFO - Finished converting document 8-K_2025-09-03 in 0.14 sec.
2025-11-14 16:10:03,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2025-07-09' --> 'data\processed_data\CRM\8-K_2025-07-09.md'
Converted 'data\edgar_documents\CRM\8-K_2025-09-03' --> 'data\processed_data\CRM\8-K_2025-09-03.md'


2025-11-14 16:10:03,330 - INFO - Going to convert document batch...
2025-11-14 16:10:03,331 - INFO - Processing document 8-K_2025-10-16
2025-11-14 16:10:03,389 - INFO - Finished converting document 8-K_2025-10-16 in 0.14 sec.
2025-11-14 16:10:03,465 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:10:03,466 - ERROR - Input document DEF-14A_2023-04-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:10:03,469 - INFO - Going to convert 

Converted 'data\edgar_documents\CRM\8-K_2025-10-16' --> 'data\processed_data\CRM\8-K_2025-10-16.md'
Error processing data\edgar_documents\CRM\DEF-14A_2023-04-27: File format not allowed: data\edgar_documents\CRM\DEF-14A_2023-04-27
Error processing data\edgar_documents\CRM\DEF-14A_2024-05-16: File format not allowed: data\edgar_documents\CRM\DEF-14A_2024-05-16


2025-11-14 16:10:03,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:05,898 - INFO - Going to convert document batch...
2025-11-14 16:10:05,900 - INFO - Processing document DEF-14A_2025-04-24
2025-11-14 16:10:50,592 - INFO - Finished converting document DEF-14A_2025-04-24 in 47.06 sec.
2025-11-14 16:10:52,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\DEF-14A_2025-04-24' --> 'data\processed_data\CRM\DEF-14A_2025-04-24.md'
Processed 509 new files. Errors: 2
Found 128 files to process in data\edgar_documents\CSCO


2025-11-14 16:10:53,216 - INFO - Going to convert document batch...
2025-11-14 16:10:53,218 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:10:53,218 - INFO - Processing document 10-K_2023-09-07
2025-11-14 16:10:55,011 - INFO - Finished converting document 10-K_2023-09-07 in 2.86 sec.
2025-11-14 16:10:55,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2023-09-07' --> 'data\processed_data\CSCO\10-K_2023-09-07.md'


2025-11-14 16:10:56,617 - INFO - Going to convert document batch...
2025-11-14 16:10:56,618 - INFO - Processing document 10-K_2024-09-05
2025-11-14 16:10:58,499 - INFO - Finished converting document 10-K_2024-09-05 in 2.91 sec.
2025-11-14 16:10:59,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2024-09-05' --> 'data\processed_data\CSCO\10-K_2024-09-05.md'


2025-11-14 16:11:00,380 - INFO - Going to convert document batch...
2025-11-14 16:11:00,380 - INFO - Processing document 10-K_2025-09-03
2025-11-14 16:11:02,250 - INFO - Finished converting document 10-K_2025-09-03 in 3.09 sec.
2025-11-14 16:11:02,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2025-09-03' --> 'data\processed_data\CSCO\10-K_2025-09-03.md'


2025-11-14 16:11:03,523 - INFO - Going to convert document batch...
2025-11-14 16:11:03,524 - INFO - Processing document 10-Q_2023-02-21
2025-11-14 16:11:05,454 - INFO - Finished converting document 10-Q_2023-02-21 in 2.59 sec.
2025-11-14 16:11:06,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-02-21' --> 'data\processed_data\CSCO\10-Q_2023-02-21.md'


2025-11-14 16:11:06,671 - INFO - Going to convert document batch...
2025-11-14 16:11:06,672 - INFO - Processing document 10-Q_2023-05-24
2025-11-14 16:11:08,187 - INFO - Finished converting document 10-Q_2023-05-24 in 2.17 sec.
2025-11-14 16:11:08,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-05-24' --> 'data\processed_data\CSCO\10-Q_2023-05-24.md'


2025-11-14 16:11:09,807 - INFO - Going to convert document batch...
2025-11-14 16:11:09,808 - INFO - Processing document 10-Q_2023-11-21
2025-11-14 16:11:11,031 - INFO - Finished converting document 10-Q_2023-11-21 in 2.25 sec.
2025-11-14 16:11:11,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-11-21' --> 'data\processed_data\CSCO\10-Q_2023-11-21.md'


2025-11-14 16:11:12,499 - INFO - Going to convert document batch...
2025-11-14 16:11:12,500 - INFO - Processing document 10-Q_2024-02-20
2025-11-14 16:11:15,895 - INFO - Finished converting document 10-Q_2024-02-20 in 4.42 sec.
2025-11-14 16:11:17,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-02-20' --> 'data\processed_data\CSCO\10-Q_2024-02-20.md'


2025-11-14 16:11:20,243 - INFO - Going to convert document batch...
2025-11-14 16:11:20,245 - INFO - Processing document 10-Q_2024-05-21
2025-11-14 16:11:24,307 - INFO - Finished converting document 10-Q_2024-05-21 in 7.05 sec.
2025-11-14 16:11:25,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-05-21' --> 'data\processed_data\CSCO\10-Q_2024-05-21.md'


2025-11-14 16:11:26,925 - INFO - Going to convert document batch...
2025-11-14 16:11:26,927 - INFO - Processing document 10-Q_2024-11-19
2025-11-14 16:11:29,859 - INFO - Finished converting document 10-Q_2024-11-19 in 4.09 sec.
2025-11-14 16:11:31,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-11-19' --> 'data\processed_data\CSCO\10-Q_2024-11-19.md'


2025-11-14 16:11:33,735 - INFO - Going to convert document batch...
2025-11-14 16:11:33,737 - INFO - Processing document 10-Q_2025-02-18
2025-11-14 16:11:37,528 - INFO - Finished converting document 10-Q_2025-02-18 in 5.62 sec.
2025-11-14 16:11:39,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2025-02-18' --> 'data\processed_data\CSCO\10-Q_2025-02-18.md'


2025-11-14 16:11:40,919 - INFO - Going to convert document batch...
2025-11-14 16:11:40,920 - INFO - Processing document 10-Q_2025-05-20
2025-11-14 16:11:44,629 - INFO - Finished converting document 10-Q_2025-05-20 in 5.22 sec.
2025-11-14 16:11:46,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,004 - INFO - Going to convert document batch...
2025-11-14 16:11:47,006 - INFO - Processing document 4_2023-02-14
2025-11-14 16:11:47,059 - INFO - Finished converting document 4_2023-02-14 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\10-Q_2025-05-20' --> 'data\processed_data\CSCO\10-Q_2025-05-20.md'
Converted 'data\edgar_documents\CSCO\4_2023-02-14' --> 'data\processed_data\CSCO\4_2023-02-14.md'


2025-11-14 16:11:47,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,177 - INFO - Going to convert document batch...
2025-11-14 16:11:47,179 - INFO - Processing document 4_2023-02-22
2025-11-14 16:11:47,234 - INFO - Finished converting document 4_2023-02-22 in 0.11 sec.
2025-11-14 16:11:47,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,339 - INFO - Going to convert document batch...
2025-11-14 16:11:47,341 - INFO - Processing document 4_2023-02-24
2025-11-14 16:11:47,405 - INFO - Finished converting document 4_2023-02-24 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-02-22' --> 'data\processed_data\CSCO\4_2023-02-22.md'
Converted 'data\edgar_documents\CSCO\4_2023-02-24' --> 'data\processed_data\CSCO\4_2023-02-24.md'


2025-11-14 16:11:47,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,533 - INFO - Going to convert document batch...
2025-11-14 16:11:47,536 - INFO - Processing document 4_2023-03-14
2025-11-14 16:11:47,602 - INFO - Finished converting document 4_2023-03-14 in 0.12 sec.
2025-11-14 16:11:47,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,690 - INFO - Going to convert document batch...
2025-11-14 16:11:47,691 - INFO - Processing document 4_2023-03-17
2025-11-14 16:11:47,753 - INFO - Finished converting document 4_2023-03-17 in 0.09 sec.
2025-11-14 16:11:47,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-03-14' --> 'data\processed_data\CSCO\4_2023-03-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-03-17' --> 'data\processed_data\CSCO\4_2023-03-17.md'


2025-11-14 16:11:47,857 - INFO - Going to convert document batch...
2025-11-14 16:11:47,861 - INFO - Processing document 4_2023-05-12
2025-11-14 16:11:47,924 - INFO - Finished converting document 4_2023-05-12 in 0.12 sec.
2025-11-14 16:11:48,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,030 - INFO - Going to convert document batch...
2025-11-14 16:11:48,031 - INFO - Processing document 4_2023-05-23
2025-11-14 16:11:48,086 - INFO - Finished converting document 4_2023-05-23 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2023-05-12' --> 'data\processed_data\CSCO\4_2023-05-12.md'
Converted 'data\edgar_documents\CSCO\4_2023-05-23' --> 'data\processed_data\CSCO\4_2023-05-23.md'


2025-11-14 16:11:48,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,218 - INFO - Going to convert document batch...
2025-11-14 16:11:48,220 - INFO - Processing document 4_2023-06-08
2025-11-14 16:11:48,256 - INFO - Finished converting document 4_2023-06-08 in 0.09 sec.
2025-11-14 16:11:48,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,362 - INFO - Going to convert document batch...
2025-11-14 16:11:48,365 - INFO - Processing document 4_2023-06-13
2025-11-14 16:11:48,422 - INFO - Finished converting document 4_2023-06-13 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\4_2023-06-08' --> 'data\processed_data\CSCO\4_2023-06-08.md'
Converted 'data\edgar_documents\CSCO\4_2023-06-13' --> 'data\processed_data\CSCO\4_2023-06-13.md'


2025-11-14 16:11:48,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,545 - INFO - Going to convert document batch...
2025-11-14 16:11:48,547 - INFO - Processing document 4_2023-06-14
2025-11-14 16:11:48,605 - INFO - Finished converting document 4_2023-06-14 in 0.14 sec.
2025-11-14 16:11:48,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,691 - INFO - Going to convert document batch...
2025-11-14 16:11:48,693 - INFO - Processing document 4_2023-06-16
2025-11-14 16:11:48,727 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.
2025-11-14 16:11:48,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,821 - INFO - Going to convert document batch...
2025-11-14 16:11:48,823 - INFO - Processing document 4_2023-06-23


Converted 'data\edgar_documents\CSCO\4_2023-06-14' --> 'data\processed_data\CSCO\4_2023-06-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-06-16' --> 'data\processed_data\CSCO\4_2023-06-16.md'


2025-11-14 16:11:48,862 - INFO - Finished converting document 4_2023-06-23 in 0.09 sec.
2025-11-14 16:11:48,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,957 - INFO - Going to convert document batch...
2025-11-14 16:11:48,958 - INFO - Processing document 4_2023-08-14
2025-11-14 16:11:48,999 - INFO - Finished converting document 4_2023-08-14 in 0.08 sec.
2025-11-14 16:11:49,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,094 - INFO - Going to convert document batch...
2025-11-14 16:11:49,096 - INFO - Processing document 4_2023-08-22


Converted 'data\edgar_documents\CSCO\4_2023-06-23' --> 'data\processed_data\CSCO\4_2023-06-23.md'
Converted 'data\edgar_documents\CSCO\4_2023-08-14' --> 'data\processed_data\CSCO\4_2023-08-14.md'


2025-11-14 16:11:49,144 - INFO - Finished converting document 4_2023-08-22 in 0.11 sec.
2025-11-14 16:11:49,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,321 - INFO - Going to convert document batch...
2025-11-14 16:11:49,324 - INFO - Processing document 4_2023-08-23
2025-11-14 16:11:49,407 - INFO - Finished converting document 4_2023-08-23 in 0.19 sec.


Converted 'data\edgar_documents\CSCO\4_2023-08-22' --> 'data\processed_data\CSCO\4_2023-08-22.md'


2025-11-14 16:11:49,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,468 - INFO - Going to convert document batch...
2025-11-14 16:11:49,470 - INFO - Processing document 4_2023-09-12
2025-11-14 16:11:49,493 - INFO - Finished converting document 4_2023-09-12 in 0.05 sec.
2025-11-14 16:11:49,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,599 - INFO - Going to convert document batch...
2025-11-14 16:11:49,601 - INFO - Processing document 4_2023-09-14
2025-11-14 16:11:49,642 - INFO - Finished converting document 4_2023-09-14 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2023-08-23' --> 'data\processed_data\CSCO\4_2023-08-23.md'
Converted 'data\edgar_documents\CSCO\4_2023-09-12' --> 'data\processed_data\CSCO\4_2023-09-12.md'


2025-11-14 16:11:49,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,761 - INFO - Going to convert document batch...
2025-11-14 16:11:49,764 - INFO - Processing document 4_2023-09-19
2025-11-14 16:11:49,814 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 16:11:49,878 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:49,880 - ERROR - Input document 4_2023-09-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11

Converted 'data\edgar_documents\CSCO\4_2023-09-14' --> 'data\processed_data\CSCO\4_2023-09-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-09-19' --> 'data\processed_data\CSCO\4_2023-09-19.md'
Error processing data\edgar_documents\CSCO\4_2023-09-21: File format not allowed: data\edgar_documents\CSCO\4_2023-09-21


2025-11-14 16:11:49,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,947 - INFO - Going to convert document batch...
2025-11-14 16:11:49,950 - INFO - Processing document 4_2023-09-25
2025-11-14 16:11:49,994 - INFO - Finished converting document 4_2023-09-25 in 0.12 sec.
2025-11-14 16:11:50,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,055 - INFO - Going to convert document batch...
2025-11-14 16:11:50,055 - INFO - Processing document 4_2023-10-12
2025-11-14 16:11:50,088 - INFO - Finished converting document 4_2023-10-12 in 0.05 sec.
2025-11-14 16:11:50,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,204 - INFO - Going to convert document batch...
2025-11-14 16:11:50,206 - INFO - Processing document 4_2023-11-14
2025-11-14 16:11:50,261 - INFO - Finished converting document 4_2023-11-14 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-09-25' --> 'data\processed_data\CSCO\4_2023-09-25.md'
Converted 'data\edgar_documents\CSCO\4_2023-10-12' --> 'data\processed_data\CSCO\4_2023-10-12.md'


2025-11-14 16:11:50,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,359 - INFO - Going to convert document batch...
2025-11-14 16:11:50,360 - INFO - Processing document 4_2023-11-21
2025-11-14 16:11:50,399 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 16:11:50,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-11-14' --> 'data\processed_data\CSCO\4_2023-11-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-11-21' --> 'data\processed_data\CSCO\4_2023-11-21.md'


2025-11-14 16:11:50,526 - INFO - Going to convert document batch...
2025-11-14 16:11:50,529 - INFO - Processing document 4_2023-11-30
2025-11-14 16:11:50,606 - INFO - Finished converting document 4_2023-11-30 in 0.16 sec.
2025-11-14 16:11:50,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,707 - INFO - Going to convert document batch...
2025-11-14 16:11:50,708 - INFO - Processing document 4_2023-12-08
2025-11-14 16:11:50,778 - INFO - Finished converting document 4_2023-12-08 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-11-30' --> 'data\processed_data\CSCO\4_2023-11-30.md'
Converted 'data\edgar_documents\CSCO\4_2023-12-08' --> 'data\processed_data\CSCO\4_2023-12-08.md'


2025-11-14 16:11:50,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,911 - INFO - Going to convert document batch...
2025-11-14 16:11:50,913 - INFO - Processing document 4_2023-12-12
2025-11-14 16:11:50,968 - INFO - Finished converting document 4_2023-12-12 in 0.12 sec.
2025-11-14 16:11:51,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,044 - INFO - Going to convert document batch...
2025-11-14 16:11:51,045 - INFO - Processing document 4_2023-12-15
2025-11-14 16:11:51,101 - INFO - Finished converting document 4_2023-12-15 in 0.09 sec.
2025-11-14 16:11:51,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-12-12' --> 'data\processed_data\CSCO\4_2023-12-12.md'
Converted 'data\edgar_documents\CSCO\4_2023-12-15' --> 'data\processed_data\CSCO\4_2023-12-15.md'


2025-11-14 16:11:51,201 - INFO - Going to convert document batch...
2025-11-14 16:11:51,203 - INFO - Processing document 4_2023-12-18
2025-11-14 16:11:51,274 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 16:11:51,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,339 - INFO - Going to convert document batch...
2025-11-14 16:11:51,341 - INFO - Processing document 4_2024-02-13
2025-11-14 16:11:51,387 - INFO - Finished converting document 4_2024-02-13 in 0.08 sec.
2025-11-14 16:11:51,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,492 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\4_2023-12-18' --> 'data\processed_data\CSCO\4_2023-12-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-02-13' --> 'data\processed_data\CSCO\4_2024-02-13.md'


2025-11-14 16:11:51,495 - INFO - Processing document 4_2024-02-21
2025-11-14 16:11:51,541 - INFO - Finished converting document 4_2024-02-21 in 0.09 sec.
2025-11-14 16:11:51,623 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:51,624 - ERROR - Input document 4_2024-02-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11:51,627 - INFO - Going to convert document batch...
2025-11-14 16:11:51,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11

Converted 'data\edgar_documents\CSCO\4_2024-02-21' --> 'data\processed_data\CSCO\4_2024-02-21.md'
Error processing data\edgar_documents\CSCO\4_2024-02-22: File format not allowed: data\edgar_documents\CSCO\4_2024-02-22
Converted 'data\edgar_documents\CSCO\4_2024-03-07' --> 'data\processed_data\CSCO\4_2024-03-07.md'


2025-11-14 16:11:51,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,819 - INFO - Going to convert document batch...
2025-11-14 16:11:51,822 - INFO - Processing document 4_2024-03-12
2025-11-14 16:11:51,871 - INFO - Finished converting document 4_2024-03-12 in 0.11 sec.
2025-11-14 16:11:51,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,972 - INFO - Going to convert document batch...
2025-11-14 16:11:51,974 - INFO - Processing document 4_2024-03-14
2025-11-14 16:11:52,029 - INFO - Finished converting document 4_2024-03-14 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2024-03-12' --> 'data\processed_data\CSCO\4_2024-03-12.md'
Converted 'data\edgar_documents\CSCO\4_2024-03-14' --> 'data\processed_data\CSCO\4_2024-03-14.md'


2025-11-14 16:11:52,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,123 - INFO - Going to convert document batch...
2025-11-14 16:11:52,124 - INFO - Processing document 4_2024-03-19
2025-11-14 16:11:52,175 - INFO - Finished converting document 4_2024-03-19 in 0.11 sec.
2025-11-14 16:11:52,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,256 - INFO - Going to convert document batch...
2025-11-14 16:11:52,257 - INFO - Processing document 4_2024-05-14
2025-11-14 16:11:52,297 - INFO - Finished converting document 4_2024-05-14 in 0.08 sec.
2025-11-14 16:11:52,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,391 - INFO - Going to convert document batch...
2025-11-14 16:11:52,393 - INFO - Processing document 4_2024-05-21


Converted 'data\edgar_documents\CSCO\4_2024-03-19' --> 'data\processed_data\CSCO\4_2024-03-19.md'
Converted 'data\edgar_documents\CSCO\4_2024-05-14' --> 'data\processed_data\CSCO\4_2024-05-14.md'


2025-11-14 16:11:52,452 - INFO - Finished converting document 4_2024-05-21 in 0.11 sec.
2025-11-14 16:11:52,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,534 - INFO - Going to convert document batch...
2025-11-14 16:11:52,535 - INFO - Processing document 4_2024-05-31
2025-11-14 16:11:52,578 - INFO - Finished converting document 4_2024-05-31 in 0.08 sec.
2025-11-14 16:11:52,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,660 - INFO - Going to convert document batch...
2025-11-14 16:11:52,661 - INFO - Processing document 4_2024-06-12


Converted 'data\edgar_documents\CSCO\4_2024-05-21' --> 'data\processed_data\CSCO\4_2024-05-21.md'
Converted 'data\edgar_documents\CSCO\4_2024-05-31' --> 'data\processed_data\CSCO\4_2024-05-31.md'


2025-11-14 16:11:52,719 - INFO - Finished converting document 4_2024-06-12 in 0.11 sec.
2025-11-14 16:11:52,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,847 - INFO - Going to convert document batch...
2025-11-14 16:11:52,850 - INFO - Processing document 4_2024-06-14
2025-11-14 16:11:52,889 - INFO - Finished converting document 4_2024-06-14 in 0.08 sec.
2025-11-14 16:11:52,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,982 - INFO - Going to convert document batch...
2025-11-14 16:11:52,984 - INFO - Processing document 4_2024-06-18


Converted 'data\edgar_documents\CSCO\4_2024-06-12' --> 'data\processed_data\CSCO\4_2024-06-12.md'
Converted 'data\edgar_documents\CSCO\4_2024-06-14' --> 'data\processed_data\CSCO\4_2024-06-14.md'


2025-11-14 16:11:53,038 - INFO - Finished converting document 4_2024-06-18 in 0.09 sec.
2025-11-14 16:11:53,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,147 - INFO - Going to convert document batch...
2025-11-14 16:11:53,149 - INFO - Processing document 4_2024-08-13
2025-11-14 16:11:53,204 - INFO - Finished converting document 4_2024-08-13 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2024-06-18' --> 'data\processed_data\CSCO\4_2024-06-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-08-13' --> 'data\processed_data\CSCO\4_2024-08-13.md'


2025-11-14 16:11:53,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,321 - INFO - Going to convert document batch...
2025-11-14 16:11:53,324 - INFO - Processing document 4_2024-08-20
2025-11-14 16:11:53,395 - INFO - Finished converting document 4_2024-08-20 in 0.12 sec.
2025-11-14 16:11:53,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,495 - INFO - Going to convert document batch...
2025-11-14 16:11:53,497 - INFO - Processing document 4_2024-08-22
2025-11-14 16:11:53,555 - INFO - Finished converting document 4_2024-08-22 in 0.09 sec.
2025-11-14 16:11:53,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-08-20' --> 'data\processed_data\CSCO\4_2024-08-20.md'
Converted 'data\edgar_documents\CSCO\4_2024-08-22' --> 'data\processed_data\CSCO\4_2024-08-22.md'


2025-11-14 16:11:53,655 - INFO - Going to convert document batch...
2025-11-14 16:11:53,656 - INFO - Processing document 4_2024-08-28
2025-11-14 16:11:53,692 - INFO - Finished converting document 4_2024-08-28 in 0.08 sec.
2025-11-14 16:11:53,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,807 - INFO - Going to convert document batch...
2025-11-14 16:11:53,809 - INFO - Processing document 4_2024-09-12
2025-11-14 16:11:53,857 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.
2025-11-14 16:11:53,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,942 - INFO - Going to convert document batch...
2025-11-14 16:11:53,944 - INFO - Processing document 4_2024-09-18


Converted 'data\edgar_documents\CSCO\4_2024-08-28' --> 'data\processed_data\CSCO\4_2024-08-28.md'
Converted 'data\edgar_documents\CSCO\4_2024-09-12' --> 'data\processed_data\CSCO\4_2024-09-12.md'


2025-11-14 16:11:54,006 - INFO - Finished converting document 4_2024-09-18 in 0.11 sec.
2025-11-14 16:11:54,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,123 - INFO - Going to convert document batch...
2025-11-14 16:11:54,125 - INFO - Processing document 4_2024-09-23
2025-11-14 16:11:54,175 - INFO - Finished converting document 4_2024-09-23 in 0.11 sec.
2025-11-14 16:11:54,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,245 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\4_2024-09-18' --> 'data\processed_data\CSCO\4_2024-09-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-09-23' --> 'data\processed_data\CSCO\4_2024-09-23.md'


2025-11-14 16:11:54,246 - INFO - Processing document 4_2024-11-06
2025-11-14 16:11:54,321 - INFO - Finished converting document 4_2024-11-06 in 0.09 sec.
2025-11-14 16:11:54,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,396 - INFO - Going to convert document batch...
2025-11-14 16:11:54,397 - INFO - Processing document 4_2024-11-13
2025-11-14 16:11:54,439 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 16:11:54,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,529 - INFO - Going to convert document batch...
2025-11-14 16:11:54,531 - INFO - Processing document 4_2024-11-19


Converted 'data\edgar_documents\CSCO\4_2024-11-06' --> 'data\processed_data\CSCO\4_2024-11-06.md'
Converted 'data\edgar_documents\CSCO\4_2024-11-13' --> 'data\processed_data\CSCO\4_2024-11-13.md'


2025-11-14 16:11:54,587 - INFO - Finished converting document 4_2024-11-19 in 0.11 sec.
2025-11-14 16:11:54,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,693 - INFO - Going to convert document batch...
2025-11-14 16:11:54,695 - INFO - Processing document 4_2024-11-21
2025-11-14 16:11:54,749 - INFO - Finished converting document 4_2024-11-21 in 0.11 sec.
2025-11-14 16:11:54,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-11-19' --> 'data\processed_data\CSCO\4_2024-11-19.md'
Converted 'data\edgar_documents\CSCO\4_2024-11-21' --> 'data\processed_data\CSCO\4_2024-11-21.md'


2025-11-14 16:11:54,864 - INFO - Going to convert document batch...
2025-11-14 16:11:54,866 - INFO - Processing document 4_2024-12-02
2025-11-14 16:11:54,908 - INFO - Finished converting document 4_2024-12-02 in 0.09 sec.
2025-11-14 16:11:54,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,977 - INFO - Going to convert document batch...
2025-11-14 16:11:54,977 - INFO - Processing document 4_2024-12-06
2025-11-14 16:11:55,006 - INFO - Finished converting document 4_2024-12-06 in 0.06 sec.
2025-11-14 16:11:55,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,096 - INFO - Going to convert document batch...
2025-11-14 16:11:55,098 - INFO - Processing document 4_2024-12-11


Converted 'data\edgar_documents\CSCO\4_2024-12-02' --> 'data\processed_data\CSCO\4_2024-12-02.md'
Converted 'data\edgar_documents\CSCO\4_2024-12-06' --> 'data\processed_data\CSCO\4_2024-12-06.md'


2025-11-14 16:11:55,160 - INFO - Finished converting document 4_2024-12-11 in 0.12 sec.
2025-11-14 16:11:55,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,268 - INFO - Going to convert document batch...
2025-11-14 16:11:55,269 - INFO - Processing document 4_2024-12-12
2025-11-14 16:11:55,311 - INFO - Finished converting document 4_2024-12-12 in 0.09 sec.
2025-11-14 16:11:55,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-12-11' --> 'data\processed_data\CSCO\4_2024-12-11.md'
Converted 'data\edgar_documents\CSCO\4_2024-12-12' --> 'data\processed_data\CSCO\4_2024-12-12.md'


2025-11-14 16:11:55,407 - INFO - Going to convert document batch...
2025-11-14 16:11:55,410 - INFO - Processing document 4_2025-02-12
2025-11-14 16:11:55,469 - INFO - Finished converting document 4_2025-02-12 in 0.11 sec.
2025-11-14 16:11:55,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,572 - INFO - Going to convert document batch...
2025-11-14 16:11:55,573 - INFO - Processing document 4_2025-02-18
2025-11-14 16:11:55,627 - INFO - Finished converting document 4_2025-02-18 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\4_2025-02-12' --> 'data\processed_data\CSCO\4_2025-02-12.md'
Converted 'data\edgar_documents\CSCO\4_2025-02-18' --> 'data\processed_data\CSCO\4_2025-02-18.md'


2025-11-14 16:11:55,698 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:55,700 - ERROR - Input document 4_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11:55,703 - INFO - Going to convert document batch...
2025-11-14 16:11:55,736 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:55,739 - ERROR - Input document 4_2025-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CSCO\4_2025-02-19: File format not allowed: data\edgar_documents\CSCO\4_2025-02-19
Error processing data\edgar_documents\CSCO\4_2025-02-21: File format not allowed: data\edgar_documents\CSCO\4_2025-02-21


2025-11-14 16:11:55,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,956 - INFO - Going to convert document batch...
2025-11-14 16:11:55,957 - INFO - Processing document 4_2025-02-27
2025-11-14 16:11:55,990 - INFO - Finished converting document 4_2025-02-27 in 0.06 sec.
2025-11-14 16:11:56,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,083 - INFO - Going to convert document batch...
2025-11-14 16:11:56,085 - INFO - Processing document 4_2025-03-12


Converted 'data\edgar_documents\CSCO\4_2025-02-24' --> 'data\processed_data\CSCO\4_2025-02-24.md'
Converted 'data\edgar_documents\CSCO\4_2025-02-27' --> 'data\processed_data\CSCO\4_2025-02-27.md'


2025-11-14 16:11:56,147 - INFO - Finished converting document 4_2025-03-12 in 0.12 sec.
2025-11-14 16:11:56,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,247 - INFO - Going to convert document batch...
2025-11-14 16:11:56,251 - INFO - Processing document 4_2025-03-18
2025-11-14 16:11:56,321 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.
2025-11-14 16:11:56,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-03-12' --> 'data\processed_data\CSCO\4_2025-03-12.md'
Converted 'data\edgar_documents\CSCO\4_2025-03-18' --> 'data\processed_data\CSCO\4_2025-03-18.md'


2025-11-14 16:11:56,431 - INFO - Going to convert document batch...
2025-11-14 16:11:56,434 - INFO - Processing document 4_2025-05-13
2025-11-14 16:11:56,492 - INFO - Finished converting document 4_2025-05-13 in 0.09 sec.
2025-11-14 16:11:56,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,571 - INFO - Going to convert document batch...
2025-11-14 16:11:56,575 - INFO - Processing document 4_2025-05-20
2025-11-14 16:11:56,635 - INFO - Finished converting document 4_2025-05-20 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2025-05-13' --> 'data\processed_data\CSCO\4_2025-05-13.md'
Converted 'data\edgar_documents\CSCO\4_2025-05-20' --> 'data\processed_data\CSCO\4_2025-05-20.md'


2025-11-14 16:11:56,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,748 - INFO - Going to convert document batch...
2025-11-14 16:11:56,750 - INFO - Processing document 4_2025-05-29
2025-11-14 16:11:56,787 - INFO - Finished converting document 4_2025-05-29 in 0.08 sec.
2025-11-14 16:11:56,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,884 - INFO - Going to convert document batch...
2025-11-14 16:11:56,886 - INFO - Processing document 4_2025-06-06
2025-11-14 16:11:56,943 - INFO - Finished converting document 4_2025-06-06 in 0.09 sec.
2025-11-14 16:11:57,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-05-29' --> 'data\processed_data\CSCO\4_2025-05-29.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-06' --> 'data\processed_data\CSCO\4_2025-06-06.md'


2025-11-14 16:11:57,041 - INFO - Going to convert document batch...
2025-11-14 16:11:57,045 - INFO - Processing document 4_2025-06-09
2025-11-14 16:11:57,100 - INFO - Finished converting document 4_2025-06-09 in 0.09 sec.
2025-11-14 16:11:57,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,215 - INFO - Going to convert document batch...
2025-11-14 16:11:57,216 - INFO - Processing document 4_2025-06-12
2025-11-14 16:11:57,290 - INFO - Finished converting document 4_2025-06-12 in 0.11 sec.
2025-11-14 16:11:57,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-06-09' --> 'data\processed_data\CSCO\4_2025-06-09.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-12' --> 'data\processed_data\CSCO\4_2025-06-12.md'


2025-11-14 16:11:57,381 - INFO - Going to convert document batch...
2025-11-14 16:11:57,383 - INFO - Processing document 4_2025-06-18
2025-11-14 16:11:57,432 - INFO - Finished converting document 4_2025-06-18 in 0.11 sec.
2025-11-14 16:11:57,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,513 - INFO - Going to convert document batch...
2025-11-14 16:11:57,514 - INFO - Processing document 4_2025-06-20
2025-11-14 16:11:57,569 - INFO - Finished converting document 4_2025-06-20 in 0.09 sec.
2025-11-14 16:11:57,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,649 - INFO - Going to convert document batch...
2025-11-14 16:11:57,650 - INFO - Processing document 4_2025-07-14


Converted 'data\edgar_documents\CSCO\4_2025-06-18' --> 'data\processed_data\CSCO\4_2025-06-18.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-20' --> 'data\processed_data\CSCO\4_2025-06-20.md'


2025-11-14 16:11:57,686 - INFO - Finished converting document 4_2025-07-14 in 0.08 sec.
2025-11-14 16:11:57,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,772 - INFO - Going to convert document batch...
2025-11-14 16:11:57,773 - INFO - Processing document 4_2025-08-12
2025-11-14 16:11:57,838 - INFO - Finished converting document 4_2025-08-12 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2025-07-14' --> 'data\processed_data\CSCO\4_2025-07-14.md'
Converted 'data\edgar_documents\CSCO\4_2025-08-12' --> 'data\processed_data\CSCO\4_2025-08-12.md'


2025-11-14 16:11:57,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,963 - INFO - Going to convert document batch...
2025-11-14 16:11:57,965 - INFO - Processing document 4_2025-08-19
2025-11-14 16:11:58,038 - INFO - Finished converting document 4_2025-08-19 in 0.12 sec.
2025-11-14 16:11:58,124 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,142 - INFO - Going to convert document batch...
2025-11-14 16:11:58,144 - INFO - Processing document 4_2025-08-20
2025-11-14 16:11:58,189 - INFO - Finished converting document 4_2025-08-20 in 0.08 sec.


Converted 'data\edgar_documents\CSCO\4_2025-08-19' --> 'data\processed_data\CSCO\4_2025-08-19.md'
Converted 'data\edgar_documents\CSCO\4_2025-08-20' --> 'data\processed_data\CSCO\4_2025-08-20.md'


2025-11-14 16:11:58,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,337 - INFO - Going to convert document batch...
2025-11-14 16:11:58,339 - INFO - Processing document 4_2025-08-27
2025-11-14 16:11:58,405 - INFO - Finished converting document 4_2025-08-27 in 0.12 sec.
2025-11-14 16:11:58,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,506 - INFO - Going to convert document batch...
2025-11-14 16:11:58,507 - INFO - Processing document 4_2025-09-11
2025-11-14 16:11:58,558 - INFO - Finished converting document 4_2025-09-11 in 0.09 sec.
2025-11-14 16:11:58,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,624 - INFO - Going to convert document batch...
2025-11-14 16:11:58,628 - INFO - Processing document 4_2025-09-15


Converted 'data\edgar_documents\CSCO\4_2025-08-27' --> 'data\processed_data\CSCO\4_2025-08-27.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-11' --> 'data\processed_data\CSCO\4_2025-09-11.md'


2025-11-14 16:11:58,698 - INFO - Finished converting document 4_2025-09-15 in 0.11 sec.
2025-11-14 16:11:58,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,796 - INFO - Going to convert document batch...
2025-11-14 16:11:58,799 - INFO - Processing document 4_2025-09-17
2025-11-14 16:11:58,861 - INFO - Finished converting document 4_2025-09-17 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2025-09-15' --> 'data\processed_data\CSCO\4_2025-09-15.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-17' --> 'data\processed_data\CSCO\4_2025-09-17.md'


2025-11-14 16:11:58,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,970 - INFO - Going to convert document batch...
2025-11-14 16:11:58,972 - INFO - Processing document 4_2025-09-18
2025-11-14 16:11:59,010 - INFO - Finished converting document 4_2025-09-18 in 0.11 sec.
2025-11-14 16:11:59,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,087 - INFO - Going to convert document batch...
2025-11-14 16:11:59,088 - INFO - Processing document 4_2025-09-22
2025-11-14 16:11:59,128 - INFO - Finished converting document 4_2025-09-22 in 0.08 sec.
2025-11-14 16:11:59,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,220 - INFO - Going to convert document batch...
2025-11-14 16:11:59,222 - INFO - Processing document 4_2025-10-14


Converted 'data\edgar_documents\CSCO\4_2025-09-18' --> 'data\processed_data\CSCO\4_2025-09-18.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-22' --> 'data\processed_data\CSCO\4_2025-09-22.md'


2025-11-14 16:11:59,263 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.
2025-11-14 16:11:59,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,343 - INFO - Going to convert document batch...
2025-11-14 16:11:59,344 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:11:59,379 - INFO - Finished converting document 8-K_2023-02-15 in 0.08 sec.
2025-11-14 16:11:59,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,470 - INFO - Going to convert document batch...
2025-11-14 16:11:59,471 - INFO - Processing document 8-K_2023-02-21


Converted 'data\edgar_documents\CSCO\4_2025-10-14' --> 'data\processed_data\CSCO\4_2025-10-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-02-15' --> 'data\processed_data\CSCO\8-K_2023-02-15.md'


2025-11-14 16:11:59,497 - INFO - Finished converting document 8-K_2023-02-21 in 0.09 sec.
2025-11-14 16:11:59,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,558 - INFO - Going to convert document batch...
2025-11-14 16:11:59,559 - INFO - Processing document 8-K_2023-03-10
2025-11-14 16:11:59,590 - INFO - Finished converting document 8-K_2023-03-10 in 0.08 sec.
2025-11-14 16:11:59,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,680 - INFO - Going to convert document batch...
2025-11-14 16:11:59,683 - INFO - Processing document 8-K_2023-05-17


Converted 'data\edgar_documents\CSCO\8-K_2023-02-21' --> 'data\processed_data\CSCO\8-K_2023-02-21.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-03-10' --> 'data\processed_data\CSCO\8-K_2023-03-10.md'


2025-11-14 16:11:59,753 - INFO - Finished converting document 8-K_2023-05-17 in 0.14 sec.
2025-11-14 16:11:59,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,832 - INFO - Going to convert document batch...
2025-11-14 16:11:59,834 - INFO - Processing document 8-K_2023-07-19
2025-11-14 16:11:59,874 - INFO - Finished converting document 8-K_2023-07-19 in 0.09 sec.
2025-11-14 16:11:59,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2023-05-17' --> 'data\processed_data\CSCO\8-K_2023-05-17.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-07-19' --> 'data\processed_data\CSCO\8-K_2023-07-19.md'


2025-11-14 16:11:59,971 - INFO - Going to convert document batch...
2025-11-14 16:11:59,973 - INFO - Processing document 8-K_2023-08-16
2025-11-14 16:12:00,018 - INFO - Finished converting document 8-K_2023-08-16 in 0.11 sec.
2025-11-14 16:12:00,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2023-08-16' --> 'data\processed_data\CSCO\8-K_2023-08-16.md'


2025-11-14 16:12:01,155 - INFO - Going to convert document batch...
2025-11-14 16:12:01,156 - INFO - Processing document 8-K_2023-09-21
2025-11-14 16:12:01,224 - INFO - Finished converting document 8-K_2023-09-21 in 1.16 sec.
2025-11-14 16:12:01,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,291 - INFO - Going to convert document batch...
2025-11-14 16:12:01,292 - INFO - Processing document 8-K_2023-09-25
2025-11-14 16:12:01,318 - INFO - Finished converting document 8-K_2023-09-25 in 0.06 sec.
2025-11-14 16:12:01,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,402 - INFO - Going to convert document batch...
2025-11-14 16:12:01,403 - INFO - Processing document 8-K_2023-10-10
2025-11-14 16:12:01,432 - INFO - Finished converting document 8-K_2023-10-10 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\8-K_2023-09-21' --> 'data\processed_data\CSCO\8-K_2023-09-21.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-09-25' --> 'data\processed_data\CSCO\8-K_2023-09-25.md'


2025-11-14 16:12:01,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,483 - INFO - Going to convert document batch...
2025-11-14 16:12:01,484 - INFO - Processing document 8-K_2023-11-15
2025-11-14 16:12:01,521 - INFO - Finished converting document 8-K_2023-11-15 in 0.06 sec.
2025-11-14 16:12:01,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,609 - INFO - Going to convert document batch...
2025-11-14 16:12:01,611 - INFO - Processing document 8-K_2023-12-08


Converted 'data\edgar_documents\CSCO\8-K_2023-10-10' --> 'data\processed_data\CSCO\8-K_2023-10-10.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-11-15' --> 'data\processed_data\CSCO\8-K_2023-11-15.md'


2025-11-14 16:12:01,682 - INFO - Finished converting document 8-K_2023-12-08 in 0.14 sec.
2025-11-14 16:12:01,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,770 - INFO - Going to convert document batch...
2025-11-14 16:12:01,771 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:12:01,834 - INFO - Finished converting document 8-K_2024-02-08 in 0.11 sec.
2025-11-14 16:12:01,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,917 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2023-12-08' --> 'data\processed_data\CSCO\8-K_2023-12-08.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-02-08' --> 'data\processed_data\CSCO\8-K_2024-02-08.md'


2025-11-14 16:12:01,918 - INFO - Processing document 8-K_2024-02-14
2025-11-14 16:12:01,951 - INFO - Finished converting document 8-K_2024-02-14 in 0.09 sec.
2025-11-14 16:12:01,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,013 - INFO - Going to convert document batch...
2025-11-14 16:12:02,015 - INFO - Processing document 8-K_2024-02-26
2025-11-14 16:12:02,076 - INFO - Finished converting document 8-K_2024-02-26 in 0.11 sec.
2025-11-14 16:12:02,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,168 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2024-02-14' --> 'data\processed_data\CSCO\8-K_2024-02-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-02-26' --> 'data\processed_data\CSCO\8-K_2024-02-26.md'


2025-11-14 16:12:02,169 - INFO - Processing document 8-K_2024-03-18
2025-11-14 16:12:02,224 - INFO - Finished converting document 8-K_2024-03-18 in 0.11 sec.
2025-11-14 16:12:02,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,305 - INFO - Going to convert document batch...
2025-11-14 16:12:02,307 - INFO - Processing document 8-K_2024-05-15
2025-11-14 16:12:02,369 - INFO - Finished converting document 8-K_2024-05-15 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\8-K_2024-03-18' --> 'data\processed_data\CSCO\8-K_2024-03-18.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-05-15' --> 'data\processed_data\CSCO\8-K_2024-05-15.md'


2025-11-14 16:12:02,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,460 - INFO - Going to convert document batch...
2025-11-14 16:12:02,463 - INFO - Processing document 8-K_2024-06-14
2025-11-14 16:12:02,501 - INFO - Finished converting document 8-K_2024-06-14 in 0.09 sec.
2025-11-14 16:12:02,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,567 - INFO - Going to convert document batch...
2025-11-14 16:12:02,568 - INFO - Processing document 8-K_2024-07-19
2025-11-14 16:12:02,603 - INFO - Finished converting document 8-K_2024-07-19 in 0.08 sec.
2025-11-14 16:12:02,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,681 - INFO - Going to convert document batch...
2025-11-14 16:12:02,682 - INFO - Processing document 8-K_2024-08-14


Converted 'data\edgar_documents\CSCO\8-K_2024-06-14' --> 'data\processed_data\CSCO\8-K_2024-06-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-07-19' --> 'data\processed_data\CSCO\8-K_2024-07-19.md'


2025-11-14 16:12:02,733 - INFO - Finished converting document 8-K_2024-08-14 in 0.11 sec.
2025-11-14 16:12:02,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,803 - INFO - Going to convert document batch...
2025-11-14 16:12:02,806 - INFO - Processing document 8-K_2024-10-11
2025-11-14 16:12:02,834 - INFO - Finished converting document 8-K_2024-10-11 in 0.08 sec.
2025-11-14 16:12:02,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,921 - INFO - Going to convert document batch...
2025-11-14 16:12:02,924 - INFO - Processing document 8-K_2024-11-13


Converted 'data\edgar_documents\CSCO\8-K_2024-08-14' --> 'data\processed_data\CSCO\8-K_2024-08-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-10-11' --> 'data\processed_data\CSCO\8-K_2024-10-11.md'


2025-11-14 16:12:02,981 - INFO - Finished converting document 8-K_2024-11-13 in 0.14 sec.
2025-11-14 16:12:03,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,086 - INFO - Going to convert document batch...
2025-11-14 16:12:03,087 - INFO - Processing document 8-K_2024-12-11
2025-11-14 16:12:03,164 - INFO - Finished converting document 8-K_2024-12-11 in 0.14 sec.


Converted 'data\edgar_documents\CSCO\8-K_2024-11-13' --> 'data\processed_data\CSCO\8-K_2024-11-13.md'


2025-11-14 16:12:03,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,234 - INFO - Going to convert document batch...
2025-11-14 16:12:03,235 - INFO - Processing document 8-K_2025-02-12
2025-11-14 16:12:03,284 - INFO - Finished converting document 8-K_2025-02-12 in 0.06 sec.
2025-11-14 16:12:03,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2024-12-11' --> 'data\processed_data\CSCO\8-K_2024-12-11.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-02-12' --> 'data\processed_data\CSCO\8-K_2025-02-12.md'


2025-11-14 16:12:03,392 - INFO - Going to convert document batch...
2025-11-14 16:12:03,394 - INFO - Processing document 8-K_2025-02-24
2025-11-14 16:12:03,468 - INFO - Finished converting document 8-K_2025-02-24 in 0.16 sec.
2025-11-14 16:12:03,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,535 - INFO - Going to convert document batch...
2025-11-14 16:12:03,537 - INFO - Processing document 8-K_2025-02-27
2025-11-14 16:12:03,583 - INFO - Finished converting document 8-K_2025-02-27 in 0.08 sec.
2025-11-14 16:12:03,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,661 - INFO - Going to convert document batch...
2025-11-14 16:12:03,663 - INFO - Processing document 8-K_2025-05-13
2025-11-14 16:12:03,705 - INFO - Finished converting document 8-K_2025-05-13 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\8-K_2025-02-24' --> 'data\processed_data\CSCO\8-K_2025-02-24.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-02-27' --> 'data\processed_data\CSCO\8-K_2025-02-27.md'


2025-11-14 16:12:03,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,758 - INFO - Going to convert document batch...
2025-11-14 16:12:03,758 - INFO - Processing document 8-K_2025-05-14
2025-11-14 16:12:03,783 - INFO - Finished converting document 8-K_2025-05-14 in 0.06 sec.
2025-11-14 16:12:03,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,842 - INFO - Going to convert document batch...
2025-11-14 16:12:03,844 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:12:03,869 - INFO - Finished converting document 8-K_2025-06-09 in 0.06 sec.


Converted 'data\edgar_documents\CSCO\8-K_2025-05-13' --> 'data\processed_data\CSCO\8-K_2025-05-13.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-05-14' --> 'data\processed_data\CSCO\8-K_2025-05-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-06-09' --> 'data\processed_data\CSCO\8-K_2025-06-09.md'


2025-11-14 16:12:03,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,967 - INFO - Going to convert document batch...
2025-11-14 16:12:03,968 - INFO - Processing document 8-K_2025-08-13
2025-11-14 16:12:04,004 - INFO - Finished converting document 8-K_2025-08-13 in 0.11 sec.
2025-11-14 16:12:04,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:04,056 - INFO - Going to convert document batch...
2025-11-14 16:12:04,058 - INFO - Processing document 8-K_2025-08-25
2025-11-14 16:12:04,110 - INFO - Finished converting document 8-K_2025-08-25 in 0.09 sec.
2025-11-14 16:12:04,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:04,195 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2025-08-13' --> 'data\processed_data\CSCO\8-K_2025-08-13.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-08-25' --> 'data\processed_data\CSCO\8-K_2025-08-25.md'


2025-11-14 16:12:04,197 - INFO - Processing document 8-K_2025-10-17
2025-11-14 16:12:04,254 - INFO - Finished converting document 8-K_2025-10-17 in 0.11 sec.
2025-11-14 16:12:04,376 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:12:04,379 - ERROR - Input document DEF-14A_2023-10-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:12:04,385 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2025-10-17' --> 'data\processed_data\CSCO\8-K_2025-10-17.md'
Error processing data\edgar_documents\CSCO\DEF-14A_2023-10-17: File format not allowed: data\edgar_documents\CSCO\DEF-14A_2023-10-17


2025-11-14 16:12:04,463 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:12:04,466 - ERROR - Input document DEF-14A_2024-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:12:04,472 - INFO - Going to convert document batch...
2025-11-14 16:12:04,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\CSCO\DEF-14A_2024-10-18: File format not allowed: data\edgar_documents\CSCO\DEF-14A_2024-10-18


2025-11-14 16:12:05,673 - INFO - Going to convert document batch...
2025-11-14 16:12:05,674 - INFO - Processing document DEF-14A_2025-10-28
2025-11-14 16:12:10,551 - INFO - Finished converting document DEF-14A_2025-10-28 in 6.08 sec.
2025-11-14 16:12:12,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\DEF-14A_2025-10-28' --> 'data\processed_data\CSCO\DEF-14A_2025-10-28.md'
Processed 122 new files. Errors: 6
Found 112 files to process in data\edgar_documents\CVS


2025-11-14 16:12:15,996 - INFO - Going to convert document batch...
2025-11-14 16:12:15,998 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:12:15,999 - INFO - Processing document 10-K_2023-02-08
2025-11-14 16:12:27,447 - INFO - Finished converting document 10-K_2023-02-08 in 15.08 sec.
2025-11-14 16:12:30,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2023-02-08' --> 'data\processed_data\CVS\10-K_2023-02-08.md'


2025-11-14 16:12:34,438 - INFO - Going to convert document batch...
2025-11-14 16:12:34,439 - INFO - Processing document 10-K_2024-02-07
2025-11-14 16:12:48,257 - INFO - Finished converting document 10-K_2024-02-07 in 17.92 sec.
2025-11-14 16:12:51,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2024-02-07' --> 'data\processed_data\CVS\10-K_2024-02-07.md'


2025-11-14 16:12:55,097 - INFO - Going to convert document batch...
2025-11-14 16:12:55,099 - INFO - Processing document 10-K_2025-02-12
2025-11-14 16:13:08,019 - INFO - Finished converting document 10-K_2025-02-12 in 17.09 sec.
2025-11-14 16:13:10,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2025-02-12' --> 'data\processed_data\CVS\10-K_2025-02-12.md'


2025-11-14 16:13:13,657 - INFO - Going to convert document batch...
2025-11-14 16:13:13,658 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 16:13:17,618 - INFO - Finished converting document 10-Q_2023-05-03 in 6.97 sec.
2025-11-14 16:13:19,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-05-03' --> 'data\processed_data\CVS\10-Q_2023-05-03.md'


2025-11-14 16:13:22,814 - INFO - Going to convert document batch...
2025-11-14 16:13:22,816 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 16:13:27,696 - INFO - Finished converting document 10-Q_2023-08-02 in 8.50 sec.
2025-11-14 16:13:29,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-08-02' --> 'data\processed_data\CVS\10-Q_2023-08-02.md'


2025-11-14 16:13:33,210 - INFO - Going to convert document batch...
2025-11-14 16:13:33,212 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 16:13:38,186 - INFO - Finished converting document 10-Q_2023-11-01 in 8.52 sec.
2025-11-14 16:13:40,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-11-01' --> 'data\processed_data\CVS\10-Q_2023-11-01.md'


2025-11-14 16:13:42,657 - INFO - Going to convert document batch...
2025-11-14 16:13:42,659 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 16:13:45,620 - INFO - Finished converting document 10-Q_2024-05-01 in 5.52 sec.
2025-11-14 16:13:47,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-05-01' --> 'data\processed_data\CVS\10-Q_2024-05-01.md'


2025-11-14 16:13:49,737 - INFO - Going to convert document batch...
2025-11-14 16:13:49,738 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:13:53,358 - INFO - Finished converting document 10-Q_2024-08-07 in 6.33 sec.
2025-11-14 16:13:55,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-08-07' --> 'data\processed_data\CVS\10-Q_2024-08-07.md'


2025-11-14 16:13:57,423 - INFO - Going to convert document batch...
2025-11-14 16:13:57,424 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 16:14:01,715 - INFO - Finished converting document 10-Q_2024-11-06 in 6.80 sec.
2025-11-14 16:14:03,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-11-06' --> 'data\processed_data\CVS\10-Q_2024-11-06.md'


2025-11-14 16:14:04,843 - INFO - Going to convert document batch...
2025-11-14 16:14:04,846 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:14:07,475 - INFO - Finished converting document 10-Q_2025-05-01 in 4.12 sec.
2025-11-14 16:14:10,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2025-05-01' --> 'data\processed_data\CVS\10-Q_2025-05-01.md'


2025-11-14 16:14:11,916 - INFO - Going to convert document batch...
2025-11-14 16:14:11,918 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 16:14:16,629 - INFO - Finished converting document 10-Q_2025-07-31 in 6.62 sec.
2025-11-14 16:14:18,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2025-07-31' --> 'data\processed_data\CVS\10-Q_2025-07-31.md'


2025-11-14 16:14:20,534 - INFO - Going to convert document batch...
2025-11-14 16:14:20,536 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 16:14:25,955 - INFO - Finished converting document 10-Q_2025-10-29 in 7.55 sec.
2025-11-14 16:14:27,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:27,961 - INFO - Going to convert document batch...
2025-11-14 16:14:27,962 - INFO - Processing document 4_2023-01-04
2025-11-14 16:14:28,049 - INFO - Finished converting document 4_2023-01-04 in 0.14 sec.


Converted 'data\edgar_documents\CVS\10-Q_2025-10-29' --> 'data\processed_data\CVS\10-Q_2025-10-29.md'


2025-11-14 16:14:28,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,197 - INFO - Going to convert document batch...
2025-11-14 16:14:28,199 - INFO - Processing document 4_2023-02-03
2025-11-14 16:14:28,279 - INFO - Finished converting document 4_2023-02-03 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-01-04' --> 'data\processed_data\CVS\4_2023-01-04.md'
Converted 'data\edgar_documents\CVS\4_2023-02-03' --> 'data\processed_data\CVS\4_2023-02-03.md'


2025-11-14 16:14:28,387 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:28,389 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:28,392 - INFO - Going to convert document batch...
2025-11-14 16:14:28,434 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:28,438 - ERROR - Input document 4_2023-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CVS\4_2023-02-13: File format not allowed: data\edgar_documents\CVS\4_2023-02-13
Error processing data\edgar_documents\CVS\4_2023-02-15: File format not allowed: data\edgar_documents\CVS\4_2023-02-15
Converted 'data\edgar_documents\CVS\4_2023-03-01' --> 'data\processed_data\CVS\4_2023-03-01.md'


2025-11-14 16:14:28,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,663 - INFO - Going to convert document batch...
2025-11-14 16:14:28,665 - INFO - Processing document 4_2023-04-04
2025-11-14 16:14:28,755 - INFO - Finished converting document 4_2023-04-04 in 0.17 sec.
2025-11-14 16:14:28,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,886 - INFO - Going to convert document batch...
2025-11-14 16:14:28,888 - INFO - Processing document 4_2023-05-05
2025-11-14 16:14:28,976 - INFO - Finished converting document 4_2023-05-05 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-04-04' --> 'data\processed_data\CVS\4_2023-04-04.md'


2025-11-14 16:14:29,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,107 - INFO - Going to convert document batch...
2025-11-14 16:14:29,109 - INFO - Processing document 4_2023-05-19
2025-11-14 16:14:29,167 - INFO - Finished converting document 4_2023-05-19 in 0.11 sec.
2025-11-14 16:14:29,263 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVS\4_2023-05-05' --> 'data\processed_data\CVS\4_2023-05-05.md'
Converted 'data\edgar_documents\CVS\4_2023-05-19' --> 'data\processed_data\CVS\4_2023-05-19.md'


2025-11-14 16:14:29,265 - ERROR - Input document 4_2023-05-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:29,267 - INFO - Going to convert document batch...
2025-11-14 16:14:29,292 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:29,299 - ERROR - Input document 4_2023-06-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\CVS\4_2023-05-30: File format not allowed: data\edgar_documents\CVS\4_2023-05-30
Error processing data\edgar_documents\CVS\4_2023-06-01: File format not allowed: data\edgar_documents\CVS\4_2023-06-01


2025-11-14 16:14:29,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,565 - INFO - Going to convert document batch...
2025-11-14 16:14:29,567 - INFO - Processing document 4_2023-09-01
2025-11-14 16:14:29,649 - INFO - Finished converting document 4_2023-09-01 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-08-04' --> 'data\processed_data\CVS\4_2023-08-04.md'


2025-11-14 16:14:29,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,771 - INFO - Going to convert document batch...
2025-11-14 16:14:29,772 - INFO - Processing document 4_2023-10-02
2025-11-14 16:14:29,827 - INFO - Finished converting document 4_2023-10-02 in 0.09 sec.
2025-11-14 16:14:29,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,927 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\4_2023-09-01' --> 'data\processed_data\CVS\4_2023-09-01.md'
Converted 'data\edgar_documents\CVS\4_2023-10-02' --> 'data\processed_data\CVS\4_2023-10-02.md'


2025-11-14 16:14:29,929 - INFO - Processing document 4_2023-11-06
2025-11-14 16:14:29,997 - INFO - Finished converting document 4_2023-11-06 in 0.12 sec.
2025-11-14 16:14:30,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,073 - INFO - Going to convert document batch...
2025-11-14 16:14:30,074 - INFO - Processing document 4_2023-11-17
2025-11-14 16:14:30,115 - INFO - Finished converting document 4_2023-11-17 in 0.08 sec.
2025-11-14 16:14:30,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2023-11-06' --> 'data\processed_data\CVS\4_2023-11-06.md'
Converted 'data\edgar_documents\CVS\4_2023-11-17' --> 'data\processed_data\CVS\4_2023-11-17.md'


2025-11-14 16:14:30,223 - INFO - Going to convert document batch...
2025-11-14 16:14:30,225 - INFO - Processing document 4_2023-12-01
2025-11-14 16:14:30,296 - INFO - Finished converting document 4_2023-12-01 in 0.12 sec.
2025-11-14 16:14:30,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,399 - INFO - Going to convert document batch...
2025-11-14 16:14:30,401 - INFO - Processing document 4_2023-12-08
2025-11-14 16:14:30,457 - INFO - Finished converting document 4_2023-12-08 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2023-12-01' --> 'data\processed_data\CVS\4_2023-12-01.md'
Converted 'data\edgar_documents\CVS\4_2023-12-08' --> 'data\processed_data\CVS\4_2023-12-08.md'


2025-11-14 16:14:30,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,596 - INFO - Going to convert document batch...
2025-11-14 16:14:30,598 - INFO - Processing document 4_2023-12-15
2025-11-14 16:14:30,685 - INFO - Finished converting document 4_2023-12-15 in 0.17 sec.
2025-11-14 16:14:30,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,811 - INFO - Going to convert document batch...
2025-11-14 16:14:30,814 - INFO - Processing document 4_2024-02-14
2025-11-14 16:14:30,892 - INFO - Finished converting document 4_2024-02-14 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-12-15' --> 'data\processed_data\CVS\4_2023-12-15.md'


2025-11-14 16:14:30,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,024 - INFO - Going to convert document batch...
2025-11-14 16:14:31,026 - INFO - Processing document 4_2024-02-16
2025-11-14 16:14:31,111 - INFO - Finished converting document 4_2024-02-16 in 0.16 sec.


Converted 'data\edgar_documents\CVS\4_2024-02-14' --> 'data\processed_data\CVS\4_2024-02-14.md'


2025-11-14 16:14:31,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,225 - INFO - Going to convert document batch...
2025-11-14 16:14:31,227 - INFO - Processing document 4_2024-02-28
2025-11-14 16:14:31,281 - INFO - Finished converting document 4_2024-02-28 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2024-02-16' --> 'data\processed_data\CVS\4_2024-02-16.md'
Converted 'data\edgar_documents\CVS\4_2024-02-28' --> 'data\processed_data\CVS\4_2024-02-28.md'


2025-11-14 16:14:31,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,418 - INFO - Going to convert document batch...
2025-11-14 16:14:31,419 - INFO - Processing document 4_2024-03-01
2025-11-14 16:14:31,464 - INFO - Finished converting document 4_2024-03-01 in 0.12 sec.
2025-11-14 16:14:31,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,536 - INFO - Going to convert document batch...
2025-11-14 16:14:31,537 - INFO - Processing document 4_2024-04-03
2025-11-14 16:14:31,572 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 16:14:31,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,665 - INFO - Going to convert document batch...
2025-11-14 16:14:31,668 - INFO - Processing document 4_2024-05-02


Converted 'data\edgar_documents\CVS\4_2024-03-01' --> 'data\processed_data\CVS\4_2024-03-01.md'
Converted 'data\edgar_documents\CVS\4_2024-04-03' --> 'data\processed_data\CVS\4_2024-04-03.md'


2025-11-14 16:14:31,725 - INFO - Finished converting document 4_2024-05-02 in 0.11 sec.
2025-11-14 16:14:31,802 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:31,803 - ERROR - Input document 4_2024-05-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:31,805 - INFO - Going to convert document batch...
2025-11-14 16:14:31,852 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:31,854 - ERROR - Input document 4_2024-05-08 with forma

Converted 'data\edgar_documents\CVS\4_2024-05-02' --> 'data\processed_data\CVS\4_2024-05-02.md'
Error processing data\edgar_documents\CVS\4_2024-05-07: File format not allowed: data\edgar_documents\CVS\4_2024-05-07
Error processing data\edgar_documents\CVS\4_2024-05-08: File format not allowed: data\edgar_documents\CVS\4_2024-05-08


2025-11-14 16:14:31,965 - INFO - Finished converting document 4_2024-05-17 in 0.11 sec.
2025-11-14 16:14:32,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,054 - INFO - Going to convert document batch...
2025-11-14 16:14:32,056 - INFO - Processing document 4_2024-09-03
2025-11-14 16:14:32,108 - INFO - Finished converting document 4_2024-09-03 in 0.08 sec.
2025-11-14 16:14:32,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,222 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\4_2024-05-17' --> 'data\processed_data\CVS\4_2024-05-17.md'
Converted 'data\edgar_documents\CVS\4_2024-09-03' --> 'data\processed_data\CVS\4_2024-09-03.md'


2025-11-14 16:14:32,224 - INFO - Processing document 4_2024-11-25
2025-11-14 16:14:32,301 - INFO - Finished converting document 4_2024-11-25 in 0.14 sec.
2025-11-14 16:14:32,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,425 - INFO - Going to convert document batch...
2025-11-14 16:14:32,433 - INFO - Processing document 4_2024-12-03
2025-11-14 16:14:32,532 - INFO - Finished converting document 4_2024-12-03 in 0.17 sec.


Converted 'data\edgar_documents\CVS\4_2024-11-25' --> 'data\processed_data\CVS\4_2024-11-25.md'


2025-11-14 16:14:32,613 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:32,614 - ERROR - Input document 4_2024-12-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:32,616 - INFO - Going to convert document batch...
2025-11-14 16:14:32,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,676 - INFO - Going to convert document batch...
2025-11-14 16:14:32,678 - INFO - Processing document 4_2024-12-09
2025-11-14 16:14:32,720 - INFO - Fin

Converted 'data\edgar_documents\CVS\4_2024-12-03' --> 'data\processed_data\CVS\4_2024-12-03.md'
Error processing data\edgar_documents\CVS\4_2024-12-05: File format not allowed: data\edgar_documents\CVS\4_2024-12-05


2025-11-14 16:14:32,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,841 - INFO - Going to convert document batch...
2025-11-14 16:14:32,844 - INFO - Processing document 4_2024-12-26
2025-11-14 16:14:32,921 - INFO - Finished converting document 4_2024-12-26 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2024-12-09' --> 'data\processed_data\CVS\4_2024-12-09.md'


2025-11-14 16:14:33,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,031 - INFO - Going to convert document batch...
2025-11-14 16:14:33,032 - INFO - Processing document 4_2025-02-19
2025-11-14 16:14:33,097 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 16:14:33,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2024-12-26' --> 'data\processed_data\CVS\4_2024-12-26.md'
Converted 'data\edgar_documents\CVS\4_2025-02-19' --> 'data\processed_data\CVS\4_2025-02-19.md'


2025-11-14 16:14:33,199 - INFO - Going to convert document batch...
2025-11-14 16:14:33,200 - INFO - Processing document 4_2025-03-03
2025-11-14 16:14:33,243 - INFO - Finished converting document 4_2025-03-03 in 0.08 sec.
2025-11-14 16:14:33,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,370 - INFO - Going to convert document batch...
2025-11-14 16:14:33,372 - INFO - Processing document 4_2025-03-07
2025-11-14 16:14:33,431 - INFO - Finished converting document 4_2025-03-07 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2025-03-03' --> 'data\processed_data\CVS\4_2025-03-03.md'
Converted 'data\edgar_documents\CVS\4_2025-03-07' --> 'data\processed_data\CVS\4_2025-03-07.md'


2025-11-14 16:14:33,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,540 - INFO - Going to convert document batch...
2025-11-14 16:14:33,541 - INFO - Processing document 4_2025-03-14
2025-11-14 16:14:33,606 - INFO - Finished converting document 4_2025-03-14 in 0.12 sec.
2025-11-14 16:14:33,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,706 - INFO - Going to convert document batch...
2025-11-14 16:14:33,707 - INFO - Processing document 4_2025-03-18
2025-11-14 16:14:33,739 - INFO - Finished converting document 4_2025-03-18 in 0.06 sec.
2025-11-14 16:14:33,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,835 - INFO - Going to convert document batch...
2025-11-14 16:14:33,836 - INFO - Processing document 4_2025-04-03


Converted 'data\edgar_documents\CVS\4_2025-03-14' --> 'data\processed_data\CVS\4_2025-03-14.md'
Converted 'data\edgar_documents\CVS\4_2025-03-18' --> 'data\processed_data\CVS\4_2025-03-18.md'


2025-11-14 16:14:33,894 - INFO - Finished converting document 4_2025-04-03 in 0.12 sec.
2025-11-14 16:14:33,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,020 - INFO - Going to convert document batch...
2025-11-14 16:14:34,022 - INFO - Processing document 4_2025-05-06
2025-11-14 16:14:34,101 - INFO - Finished converting document 4_2025-05-06 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2025-04-03' --> 'data\processed_data\CVS\4_2025-04-03.md'


2025-11-14 16:14:34,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,240 - INFO - Going to convert document batch...
2025-11-14 16:14:34,241 - INFO - Processing document 4_2025-05-09
2025-11-14 16:14:34,304 - INFO - Finished converting document 4_2025-05-09 in 0.12 sec.


Converted 'data\edgar_documents\CVS\4_2025-05-06' --> 'data\processed_data\CVS\4_2025-05-06.md'
Converted 'data\edgar_documents\CVS\4_2025-05-09' --> 'data\processed_data\CVS\4_2025-05-09.md'


2025-11-14 16:14:34,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,409 - INFO - Going to convert document batch...
2025-11-14 16:14:34,411 - INFO - Processing document 4_2025-05-19
2025-11-14 16:14:34,518 - INFO - Finished converting document 4_2025-05-19 in 0.14 sec.
2025-11-14 16:14:34,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,643 - INFO - Going to convert document batch...
2025-11-14 16:14:34,643 - INFO - Processing document 4_2025-06-03
2025-11-14 16:14:34,678 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 16:14:34,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,775 - INFO - Going to convert document batch...
2025-11-14 16:14:34,777 - INFO - Processing document 4_2025-06-09


Converted 'data\edgar_documents\CVS\4_2025-05-19' --> 'data\processed_data\CVS\4_2025-05-19.md'
Converted 'data\edgar_documents\CVS\4_2025-06-03' --> 'data\processed_data\CVS\4_2025-06-03.md'


2025-11-14 16:14:34,830 - INFO - Finished converting document 4_2025-06-09 in 0.11 sec.
2025-11-14 16:14:34,926 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:34,928 - ERROR - Input document 4_2025-08-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:34,932 - INFO - Going to convert document batch...
2025-11-14 16:14:34,967 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:34,969 - ERROR - Input document 4_2025-08-12 with forma

Converted 'data\edgar_documents\CVS\4_2025-06-09' --> 'data\processed_data\CVS\4_2025-06-09.md'
Error processing data\edgar_documents\CVS\4_2025-08-11: File format not allowed: data\edgar_documents\CVS\4_2025-08-11
Error processing data\edgar_documents\CVS\4_2025-08-12: File format not allowed: data\edgar_documents\CVS\4_2025-08-12


2025-11-14 16:14:35,080 - INFO - Finished converting document 4_2025-08-29 in 0.11 sec.
2025-11-14 16:14:35,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,170 - INFO - Going to convert document batch...
2025-11-14 16:14:35,171 - INFO - Processing document 4_2025-09-02
2025-11-14 16:14:35,203 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 16:14:35,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,292 - INFO - Going to convert document batch...
2025-11-14 16:14:35,293 - INFO - Processing document 4_2025-10-14


Converted 'data\edgar_documents\CVS\4_2025-08-29' --> 'data\processed_data\CVS\4_2025-08-29.md'
Converted 'data\edgar_documents\CVS\4_2025-09-02' --> 'data\processed_data\CVS\4_2025-09-02.md'


2025-11-14 16:14:35,349 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.
2025-11-14 16:14:35,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,461 - INFO - Going to convert document batch...
2025-11-14 16:14:35,463 - INFO - Processing document 8-K_2023-01-09
2025-11-14 16:14:35,511 - INFO - Finished converting document 8-K_2023-01-09 in 0.12 sec.
2025-11-14 16:14:35,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2025-10-14' --> 'data\processed_data\CVS\4_2025-10-14.md'
Converted 'data\edgar_documents\CVS\8-K_2023-01-09' --> 'data\processed_data\CVS\8-K_2023-01-09.md'


2025-11-14 16:14:35,596 - INFO - Going to convert document batch...
2025-11-14 16:14:35,598 - INFO - Processing document 8-K_2023-01-23
2025-11-14 16:14:35,660 - INFO - Finished converting document 8-K_2023-01-23 in 0.11 sec.
2025-11-14 16:14:35,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,761 - INFO - Going to convert document batch...
2025-11-14 16:14:35,762 - INFO - Processing document 8-K_2023-02-08
2025-11-14 16:14:35,821 - INFO - Finished converting document 8-K_2023-02-08 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-01-23' --> 'data\processed_data\CVS\8-K_2023-01-23.md'


2025-11-14 16:14:35,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,967 - INFO - Going to convert document batch...
2025-11-14 16:14:35,968 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:14:36,026 - INFO - Finished converting document 8-K_2023-02-15 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-02-08' --> 'data\processed_data\CVS\8-K_2023-02-08.md'
Converted 'data\edgar_documents\CVS\8-K_2023-02-15' --> 'data\processed_data\CVS\8-K_2023-02-15.md'


2025-11-14 16:14:36,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,133 - INFO - Going to convert document batch...
2025-11-14 16:14:36,135 - INFO - Processing document 8-K_2023-02-21
2025-11-14 16:14:36,207 - INFO - Finished converting document 8-K_2023-02-21 in 0.14 sec.
2025-11-14 16:14:36,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,275 - INFO - Going to convert document batch...
2025-11-14 16:14:36,276 - INFO - Processing document 8-K_2023-03-30
2025-11-14 16:14:36,301 - INFO - Finished converting document 8-K_2023-03-30 in 0.06 sec.
2025-11-14 16:14:36,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,387 - INFO - Going to convert document batch...
2025-11-14 16:14:36,388 - INFO - Processing document 8-K_2023-05-02


Converted 'data\edgar_documents\CVS\8-K_2023-02-21' --> 'data\processed_data\CVS\8-K_2023-02-21.md'
Converted 'data\edgar_documents\CVS\8-K_2023-03-30' --> 'data\processed_data\CVS\8-K_2023-03-30.md'


2025-11-14 16:14:36,459 - INFO - Finished converting document 8-K_2023-05-02 in 0.12 sec.
2025-11-14 16:14:36,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,575 - INFO - Going to convert document batch...
2025-11-14 16:14:36,578 - INFO - Processing document 8-K_2023-05-03
2025-11-14 16:14:36,613 - INFO - Finished converting document 8-K_2023-05-03 in 0.09 sec.
2025-11-14 16:14:36,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-05-02' --> 'data\processed_data\CVS\8-K_2023-05-02.md'
Converted 'data\edgar_documents\CVS\8-K_2023-05-03' --> 'data\processed_data\CVS\8-K_2023-05-03.md'


2025-11-14 16:14:36,721 - INFO - Going to convert document batch...
2025-11-14 16:14:36,723 - INFO - Processing document 8-K_2023-05-24
2025-11-14 16:14:36,808 - INFO - Finished converting document 8-K_2023-05-24 in 0.19 sec.
2025-11-14 16:14:36,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-05-24' --> 'data\processed_data\CVS\8-K_2023-05-24.md'


2025-11-14 16:14:37,339 - INFO - Going to convert document batch...
2025-11-14 16:14:37,341 - INFO - Processing document 8-K_2023-05-25
2025-11-14 16:14:38,791 - INFO - Finished converting document 8-K_2023-05-25 in 1.92 sec.
2025-11-14 16:14:38,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:38,907 - INFO - Going to convert document batch...
2025-11-14 16:14:38,908 - INFO - Processing document 8-K_2023-05-31
2025-11-14 16:14:38,952 - INFO - Finished converting document 8-K_2023-05-31 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-05-25' --> 'data\processed_data\CVS\8-K_2023-05-25.md'
Converted 'data\edgar_documents\CVS\8-K_2023-05-31' --> 'data\processed_data\CVS\8-K_2023-05-31.md'


2025-11-14 16:14:39,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,068 - INFO - Going to convert document batch...
2025-11-14 16:14:39,070 - INFO - Processing document 8-K_2023-06-01
2025-11-14 16:14:39,131 - INFO - Finished converting document 8-K_2023-06-01 in 0.14 sec.
2025-11-14 16:14:39,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,214 - INFO - Going to convert document batch...
2025-11-14 16:14:39,217 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:14:39,270 - INFO - Finished converting document 8-K_2023-06-02 in 0.11 sec.
2025-11-14 16:14:39,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-06-01' --> 'data\processed_data\CVS\8-K_2023-06-01.md'
Converted 'data\edgar_documents\CVS\8-K_2023-06-02' --> 'data\processed_data\CVS\8-K_2023-06-02.md'


2025-11-14 16:14:39,361 - INFO - Going to convert document batch...
2025-11-14 16:14:39,363 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:14:39,421 - INFO - Finished converting document 8-K_2023-07-20 in 0.14 sec.
2025-11-14 16:14:39,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,511 - INFO - Going to convert document batch...
2025-11-14 16:14:39,512 - INFO - Processing document 8-K_2023-08-02
2025-11-14 16:14:39,553 - INFO - Finished converting document 8-K_2023-08-02 in 0.08 sec.
2025-11-14 16:14:39,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-07-20' --> 'data\processed_data\CVS\8-K_2023-07-20.md'
Converted 'data\edgar_documents\CVS\8-K_2023-08-02' --> 'data\processed_data\CVS\8-K_2023-08-02.md'


2025-11-14 16:14:39,669 - INFO - Going to convert document batch...
2025-11-14 16:14:39,672 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:14:39,729 - INFO - Finished converting document 8-K_2023-08-17 in 0.14 sec.
2025-11-14 16:14:39,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,847 - INFO - Going to convert document batch...
2025-11-14 16:14:39,849 - INFO - Processing document 8-K_2023-08-23
2025-11-14 16:14:39,929 - INFO - Finished converting document 8-K_2023-08-23 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-08-17' --> 'data\processed_data\CVS\8-K_2023-08-17.md'
Converted 'data\edgar_documents\CVS\8-K_2023-08-23' --> 'data\processed_data\CVS\8-K_2023-08-23.md'


2025-11-14 16:14:40,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,075 - INFO - Going to convert document batch...
2025-11-14 16:14:40,078 - INFO - Processing document 8-K_2023-09-11
2025-11-14 16:14:40,167 - INFO - Finished converting document 8-K_2023-09-11 in 0.20 sec.
2025-11-14 16:14:40,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,239 - INFO - Going to convert document batch...
2025-11-14 16:14:40,240 - INFO - Processing document 8-K_2023-09-21
2025-11-14 16:14:40,293 - INFO - Finished converting document 8-K_2023-09-21 in 0.09 sec.
2025-11-14 16:14:40,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-09-11' --> 'data\processed_data\CVS\8-K_2023-09-11.md'
Converted 'data\edgar_documents\CVS\8-K_2023-09-21' --> 'data\processed_data\CVS\8-K_2023-09-21.md'


2025-11-14 16:14:40,403 - INFO - Going to convert document batch...
2025-11-14 16:14:40,405 - INFO - Processing document 8-K_2023-10-13
2025-11-14 16:14:40,452 - INFO - Finished converting document 8-K_2023-10-13 in 0.12 sec.
2025-11-14 16:14:40,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,546 - INFO - Going to convert document batch...
2025-11-14 16:14:40,547 - INFO - Processing document 8-K_2023-10-16
2025-11-14 16:14:40,619 - INFO - Finished converting document 8-K_2023-10-16 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-10-13' --> 'data\processed_data\CVS\8-K_2023-10-13.md'


2025-11-14 16:14:40,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,730 - INFO - Going to convert document batch...
2025-11-14 16:14:40,731 - INFO - Processing document 8-K_2023-11-01
2025-11-14 16:14:40,768 - INFO - Finished converting document 8-K_2023-11-01 in 0.09 sec.
2025-11-14 16:14:40,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,845 - INFO - Going to convert document batch...
2025-11-14 16:14:40,847 - INFO - Processing document 8-K_2023-12-05


Converted 'data\edgar_documents\CVS\8-K_2023-10-16' --> 'data\processed_data\CVS\8-K_2023-10-16.md'
Converted 'data\edgar_documents\CVS\8-K_2023-11-01' --> 'data\processed_data\CVS\8-K_2023-11-01.md'


2025-11-14 16:14:40,890 - INFO - Finished converting document 8-K_2023-12-05 in 0.09 sec.
2025-11-14 16:14:40,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,015 - INFO - Going to convert document batch...
2025-11-14 16:14:41,017 - INFO - Processing document 8-K_2024-01-05
2025-11-14 16:14:41,102 - INFO - Finished converting document 8-K_2024-01-05 in 0.17 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-12-05' --> 'data\processed_data\CVS\8-K_2023-12-05.md'


2025-11-14 16:14:41,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,220 - INFO - Going to convert document batch...
2025-11-14 16:14:41,223 - INFO - Processing document 8-K_2024-02-07
2025-11-14 16:14:41,286 - INFO - Finished converting document 8-K_2024-02-07 in 0.11 sec.
2025-11-14 16:14:41,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-01-05' --> 'data\processed_data\CVS\8-K_2024-01-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-02-07' --> 'data\processed_data\CVS\8-K_2024-02-07.md'


2025-11-14 16:14:41,401 - INFO - Going to convert document batch...
2025-11-14 16:14:41,403 - INFO - Processing document 8-K_2024-03-05
2025-11-14 16:14:41,498 - INFO - Finished converting document 8-K_2024-03-05 in 0.19 sec.
2025-11-14 16:14:41,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,591 - INFO - Going to convert document batch...
2025-11-14 16:14:41,594 - INFO - Processing document 8-K_2024-05-01
2025-11-14 16:14:41,645 - INFO - Finished converting document 8-K_2024-05-01 in 0.11 sec.
2025-11-14 16:14:41,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,727 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\8-K_2024-03-05' --> 'data\processed_data\CVS\8-K_2024-03-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-05-01' --> 'data\processed_data\CVS\8-K_2024-05-01.md'


2025-11-14 16:14:41,729 - INFO - Processing document 8-K_2024-05-08
2025-11-14 16:14:41,798 - INFO - Finished converting document 8-K_2024-05-08 in 0.12 sec.
2025-11-14 16:14:41,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,878 - INFO - Going to convert document batch...
2025-11-14 16:14:41,879 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:14:41,937 - INFO - Finished converting document 8-K_2024-05-09 in 0.12 sec.
2025-11-14 16:14:42,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-05-08' --> 'data\processed_data\CVS\8-K_2024-05-08.md'
Converted 'data\edgar_documents\CVS\8-K_2024-05-09' --> 'data\processed_data\CVS\8-K_2024-05-09.md'


2025-11-14 16:14:42,060 - INFO - Going to convert document batch...
2025-11-14 16:14:42,062 - INFO - Processing document 8-K_2024-05-22
2025-11-14 16:14:42,138 - INFO - Finished converting document 8-K_2024-05-22 in 0.17 sec.
2025-11-14 16:14:42,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,205 - INFO - Going to convert document batch...
2025-11-14 16:14:42,207 - INFO - Processing document 8-K_2024-08-07
2025-11-14 16:14:42,260 - INFO - Finished converting document 8-K_2024-08-07 in 0.08 sec.
2025-11-14 16:14:42,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,353 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\8-K_2024-05-22' --> 'data\processed_data\CVS\8-K_2024-05-22.md'
Converted 'data\edgar_documents\CVS\8-K_2024-08-07' --> 'data\processed_data\CVS\8-K_2024-08-07.md'


2025-11-14 16:14:42,355 - INFO - Processing document 8-K_2024-10-18
2025-11-14 16:14:42,395 - INFO - Finished converting document 8-K_2024-10-18 in 0.11 sec.
2025-11-14 16:14:42,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,463 - INFO - Going to convert document batch...
2025-11-14 16:14:42,465 - INFO - Processing document 8-K_2024-11-06
2025-11-14 16:14:42,497 - INFO - Finished converting document 8-K_2024-11-06 in 0.09 sec.
2025-11-14 16:14:42,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,584 - INFO - Going to convert document batch...
2025-11-14 16:14:42,586 - INFO - Processing document 8-K_2024-11-18


Converted 'data\edgar_documents\CVS\8-K_2024-10-18' --> 'data\processed_data\CVS\8-K_2024-10-18.md'
Converted 'data\edgar_documents\CVS\8-K_2024-11-06' --> 'data\processed_data\CVS\8-K_2024-11-06.md'


2025-11-14 16:14:42,636 - INFO - Finished converting document 8-K_2024-11-18 in 0.12 sec.
2025-11-14 16:14:42,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,727 - INFO - Going to convert document batch...
2025-11-14 16:14:42,731 - INFO - Processing document 8-K_2024-12-02
2025-11-14 16:14:42,789 - INFO - Finished converting document 8-K_2024-12-02 in 0.11 sec.
2025-11-14 16:14:42,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-11-18' --> 'data\processed_data\CVS\8-K_2024-11-18.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-02' --> 'data\processed_data\CVS\8-K_2024-12-02.md'


2025-11-14 16:14:42,869 - INFO - Going to convert document batch...
2025-11-14 16:14:42,871 - INFO - Processing document 8-K_2024-12-05
2025-11-14 16:14:42,930 - INFO - Finished converting document 8-K_2024-12-05 in 0.11 sec.
2025-11-14 16:14:42,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,010 - INFO - Going to convert document batch...
2025-11-14 16:14:43,011 - INFO - Processing document 8-K_2024-12-06
2025-11-14 16:14:43,043 - INFO - Finished converting document 8-K_2024-12-06 in 0.09 sec.
2025-11-14 16:14:43,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,092 - INFO - Going to convert document batch...
2025-11-14 16:14:43,094 - INFO - Processing document 8-K_2024-12-09
2025-11-14 16:14:43,134 - INFO - Finished converting document 8-K_2024-12-09 in 0.06 sec.


Converted 'data\edgar_documents\CVS\8-K_2024-12-05' --> 'data\processed_data\CVS\8-K_2024-12-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-06' --> 'data\processed_data\CVS\8-K_2024-12-06.md'


2025-11-14 16:14:43,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,224 - INFO - Going to convert document batch...
2025-11-14 16:14:43,226 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:14:43,298 - INFO - Finished converting document 8-K_2024-12-10 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2024-12-09' --> 'data\processed_data\CVS\8-K_2024-12-09.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-10' --> 'data\processed_data\CVS\8-K_2024-12-10.md'


2025-11-14 16:14:43,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,393 - INFO - Going to convert document batch...
2025-11-14 16:14:43,395 - INFO - Processing document 8-K_2024-12-17
2025-11-14 16:14:43,455 - INFO - Finished converting document 8-K_2024-12-17 in 0.12 sec.
2025-11-14 16:14:43,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,530 - INFO - Going to convert document batch...
2025-11-14 16:14:43,531 - INFO - Processing document 8-K_2025-02-12
2025-11-14 16:14:43,577 - INFO - Finished converting document 8-K_2025-02-12 in 0.09 sec.
2025-11-14 16:14:43,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-12-17' --> 'data\processed_data\CVS\8-K_2024-12-17.md'
Converted 'data\edgar_documents\CVS\8-K_2025-02-12' --> 'data\processed_data\CVS\8-K_2025-02-12.md'


2025-11-14 16:14:43,676 - INFO - Going to convert document batch...
2025-11-14 16:14:43,678 - INFO - Processing document 8-K_2025-04-08
2025-11-14 16:14:43,737 - INFO - Finished converting document 8-K_2025-04-08 in 0.12 sec.
2025-11-14 16:14:43,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,836 - INFO - Going to convert document batch...
2025-11-14 16:14:43,838 - INFO - Processing document 8-K_2025-05-01
2025-11-14 16:14:43,892 - INFO - Finished converting document 8-K_2025-05-01 in 0.12 sec.
2025-11-14 16:14:43,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-04-08' --> 'data\processed_data\CVS\8-K_2025-04-08.md'
Converted 'data\edgar_documents\CVS\8-K_2025-05-01' --> 'data\processed_data\CVS\8-K_2025-05-01.md'


2025-11-14 16:14:43,980 - INFO - Going to convert document batch...
2025-11-14 16:14:43,983 - INFO - Processing document 8-K_2025-05-20
2025-11-14 16:14:44,042 - INFO - Finished converting document 8-K_2025-05-20 in 0.12 sec.
2025-11-14 16:14:44,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,141 - INFO - Going to convert document batch...
2025-11-14 16:14:44,143 - INFO - Processing document 8-K_2025-07-31
2025-11-14 16:14:44,196 - INFO - Finished converting document 8-K_2025-07-31 in 0.11 sec.


Converted 'data\edgar_documents\CVS\8-K_2025-05-20' --> 'data\processed_data\CVS\8-K_2025-05-20.md'
Converted 'data\edgar_documents\CVS\8-K_2025-07-31' --> 'data\processed_data\CVS\8-K_2025-07-31.md'


2025-11-14 16:14:44,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,306 - INFO - Going to convert document batch...
2025-11-14 16:14:44,308 - INFO - Processing document 8-K_2025-08-15
2025-11-14 16:14:44,369 - INFO - Finished converting document 8-K_2025-08-15 in 0.12 sec.
2025-11-14 16:14:44,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,452 - INFO - Going to convert document batch...
2025-11-14 16:14:44,452 - INFO - Processing document 8-K_2025-09-22
2025-11-14 16:14:44,498 - INFO - Finished converting document 8-K_2025-09-22 in 0.09 sec.
2025-11-14 16:14:44,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-08-15' --> 'data\processed_data\CVS\8-K_2025-08-15.md'
Converted 'data\edgar_documents\CVS\8-K_2025-09-22' --> 'data\processed_data\CVS\8-K_2025-09-22.md'


2025-11-14 16:14:44,594 - INFO - Going to convert document batch...
2025-11-14 16:14:44,597 - INFO - Processing document 8-K_2025-10-29
2025-11-14 16:14:44,645 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 16:14:44,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-10-29' --> 'data\processed_data\CVS\8-K_2025-10-29.md'


2025-11-14 16:14:47,000 - INFO - Going to convert document batch...
2025-11-14 16:14:47,002 - INFO - Processing document DEF-14A_2023-04-07
2025-11-14 16:16:04,149 - INFO - Finished converting document DEF-14A_2023-04-07 in 79.48 sec.
2025-11-14 16:16:09,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2023-04-07' --> 'data\processed_data\CVS\DEF-14A_2023-04-07.md'


2025-11-14 16:16:11,641 - INFO - Going to convert document batch...
2025-11-14 16:16:11,643 - INFO - Processing document DEF-14A_2024-04-05
2025-11-14 16:16:19,248 - INFO - Finished converting document DEF-14A_2024-04-05 in 10.09 sec.
2025-11-14 16:17:05,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2024-04-05' --> 'data\processed_data\CVS\DEF-14A_2024-04-05.md'


2025-11-14 16:17:09,088 - INFO - Going to convert document batch...
2025-11-14 16:17:09,090 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 16:17:16,296 - INFO - Finished converting document DEF-14A_2025-04-04 in 11.16 sec.
2025-11-14 16:17:21,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2025-04-04' --> 'data\processed_data\CVS\DEF-14A_2025-04-04.md'
Processed 103 new files. Errors: 9
Found 106 files to process in data\edgar_documents\CVX


2025-11-14 16:17:27,892 - INFO - Going to convert document batch...
2025-11-14 16:17:27,893 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:17:27,895 - INFO - Processing document 10-K_2023-02-23
2025-11-14 16:17:39,216 - INFO - Finished converting document 10-K_2023-02-23 in 17.59 sec.
2025-11-14 16:17:44,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2023-02-23' --> 'data\processed_data\CVX\10-K_2023-02-23.md'


2025-11-14 16:17:49,306 - INFO - Going to convert document batch...
2025-11-14 16:17:49,309 - INFO - Processing document 10-K_2024-02-26
2025-11-14 16:18:01,471 - INFO - Finished converting document 10-K_2024-02-26 in 17.62 sec.
2025-11-14 16:18:06,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2024-02-26' --> 'data\processed_data\CVX\10-K_2024-02-26.md'


2025-11-14 16:18:11,065 - INFO - Going to convert document batch...
2025-11-14 16:18:11,068 - INFO - Processing document 10-K_2025-02-21
2025-11-14 16:18:25,616 - INFO - Finished converting document 10-K_2025-02-21 in 19.36 sec.
2025-11-14 16:18:30,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2025-02-21' --> 'data\processed_data\CVX\10-K_2025-02-21.md'


2025-11-14 16:18:32,075 - INFO - Going to convert document batch...
2025-11-14 16:18:32,077 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 16:18:34,559 - INFO - Finished converting document 10-Q_2023-05-04 in 3.73 sec.
2025-11-14 16:18:35,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-05-04' --> 'data\processed_data\CVX\10-Q_2023-05-04.md'


2025-11-14 16:18:37,793 - INFO - Going to convert document batch...
2025-11-14 16:18:37,796 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 16:18:41,677 - INFO - Finished converting document 10-Q_2023-08-03 in 6.03 sec.
2025-11-14 16:18:43,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-08-03' --> 'data\processed_data\CVX\10-Q_2023-08-03.md'


2025-11-14 16:18:46,151 - INFO - Going to convert document batch...
2025-11-14 16:18:46,153 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:18:49,790 - INFO - Finished converting document 10-Q_2023-11-02 in 6.25 sec.
2025-11-14 16:18:51,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-11-02' --> 'data\processed_data\CVX\10-Q_2023-11-02.md'


2025-11-14 16:18:52,539 - INFO - Going to convert document batch...
2025-11-14 16:18:52,540 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:18:55,545 - INFO - Finished converting document 10-Q_2024-05-02 in 3.95 sec.
2025-11-14 16:18:56,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-05-02' --> 'data\processed_data\CVX\10-Q_2024-05-02.md'


2025-11-14 16:18:58,527 - INFO - Going to convert document batch...
2025-11-14 16:18:58,529 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:19:01,680 - INFO - Finished converting document 10-Q_2024-08-07 in 4.92 sec.
2025-11-14 16:19:03,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-08-07' --> 'data\processed_data\CVX\10-Q_2024-08-07.md'


2025-11-14 16:19:05,991 - INFO - Going to convert document batch...
2025-11-14 16:19:05,993 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 16:19:09,545 - INFO - Finished converting document 10-Q_2024-11-07 in 6.09 sec.
2025-11-14 16:19:11,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-11-07' --> 'data\processed_data\CVX\10-Q_2024-11-07.md'


2025-11-14 16:19:12,556 - INFO - Going to convert document batch...
2025-11-14 16:19:12,558 - INFO - Processing document 10-Q_2025-05-08
2025-11-14 16:19:14,203 - INFO - Finished converting document 10-Q_2025-05-08 in 2.52 sec.
2025-11-14 16:19:15,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2025-05-08' --> 'data\processed_data\CVX\10-Q_2025-05-08.md'


2025-11-14 16:19:18,256 - INFO - Going to convert document batch...
2025-11-14 16:19:18,258 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:19:21,988 - INFO - Finished converting document 10-Q_2025-08-07 in 6.44 sec.
2025-11-14 16:19:24,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2025-08-07' --> 'data\processed_data\CVX\10-Q_2025-08-07.md'


2025-11-14 16:19:26,761 - INFO - Going to convert document batch...
2025-11-14 16:19:26,763 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 16:19:30,357 - INFO - Finished converting document 10-Q_2025-11-06 in 6.12 sec.
2025-11-14 16:19:32,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:32,708 - INFO - Going to convert document batch...
2025-11-14 16:19:32,710 - INFO - Processing document 4_2023-01-27


Converted 'data\edgar_documents\CVX\10-Q_2025-11-06' --> 'data\processed_data\CVX\10-Q_2025-11-06.md'


2025-11-14 16:19:32,828 - INFO - Finished converting document 4_2023-01-27 in 0.23 sec.
2025-11-14 16:19:33,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,053 - INFO - Going to convert document batch...
2025-11-14 16:19:33,056 - INFO - Processing document 4_2023-02-01
2025-11-14 16:19:33,136 - INFO - Finished converting document 4_2023-02-01 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-01-27' --> 'data\processed_data\CVX\4_2023-01-27.md'


2025-11-14 16:19:33,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,277 - INFO - Going to convert document batch...
2025-11-14 16:19:33,280 - INFO - Processing document 4_2023-02-02
2025-11-14 16:19:33,383 - INFO - Finished converting document 4_2023-02-02 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-01' --> 'data\processed_data\CVX\4_2023-02-01.md'


2025-11-14 16:19:33,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,553 - INFO - Going to convert document batch...
2025-11-14 16:19:33,555 - INFO - Processing document 4_2023-02-09
2025-11-14 16:19:33,649 - INFO - Finished converting document 4_2023-02-09 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-02' --> 'data\processed_data\CVX\4_2023-02-02.md'


2025-11-14 16:19:33,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,795 - INFO - Going to convert document batch...
2025-11-14 16:19:33,797 - INFO - Processing document 4_2023-02-27
2025-11-14 16:19:33,867 - INFO - Finished converting document 4_2023-02-27 in 0.12 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-09' --> 'data\processed_data\CVX\4_2023-02-09.md'


2025-11-14 16:19:34,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,259 - INFO - Going to convert document batch...
2025-11-14 16:19:34,261 - INFO - Processing document 4_2023-03-01


Converted 'data\edgar_documents\CVX\4_2023-02-27' --> 'data\processed_data\CVX\4_2023-02-27.md'


2025-11-14 16:19:34,354 - INFO - Finished converting document 4_2023-03-01 in 0.23 sec.
2025-11-14 16:19:34,512 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:34,514 - ERROR - Input document 4_2023-05-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:34,517 - INFO - Going to convert document batch...
2025-11-14 16:19:34,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,568 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\CVX\4_2023-03-01' --> 'data\processed_data\CVX\4_2023-03-01.md'
Error processing data\edgar_documents\CVX\4_2023-05-22: File format not allowed: data\edgar_documents\CVX\4_2023-05-22


2025-11-14 16:19:34,651 - INFO - Finished converting document 4_2023-05-30 in 0.14 sec.
2025-11-14 16:19:34,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,853 - INFO - Going to convert document batch...
2025-11-14 16:19:34,855 - INFO - Processing document 4_2023-06-02
2025-11-14 16:19:34,923 - INFO - Finished converting document 4_2023-06-02 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2023-05-30' --> 'data\processed_data\CVX\4_2023-05-30.md'


2025-11-14 16:19:35,100 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:35,103 - ERROR - Input document 4_2023-07-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:35,107 - INFO - Going to convert document batch...
2025-11-14 16:19:35,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,180 - INFO - Going to convert document batch...
2025-11-14 16:19:35,181 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\CVX\4_2023-06-02' --> 'data\processed_data\CVX\4_2023-06-02.md'
Error processing data\edgar_documents\CVX\4_2023-07-07: File format not allowed: data\edgar_documents\CVX\4_2023-07-07


2025-11-14 16:19:35,447 - INFO - Finished converting document 4_2023-08-07 in 0.33 sec.
2025-11-14 16:19:35,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,642 - INFO - Going to convert document batch...
2025-11-14 16:19:35,644 - INFO - Processing document 4_2023-08-15
2025-11-14 16:19:35,724 - INFO - Finished converting document 4_2023-08-15 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-08-07' --> 'data\processed_data\CVX\4_2023-08-07.md'


2025-11-14 16:19:35,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,901 - INFO - Going to convert document batch...
2025-11-14 16:19:35,903 - INFO - Processing document 4_2023-08-29


Converted 'data\edgar_documents\CVX\4_2023-08-15' --> 'data\processed_data\CVX\4_2023-08-15.md'


2025-11-14 16:19:36,007 - INFO - Finished converting document 4_2023-08-29 in 0.19 sec.
2025-11-14 16:19:36,284 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,287 - ERROR - Input document 4_2023-10-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))


Converted 'data\edgar_documents\CVX\4_2023-08-29' --> 'data\processed_data\CVX\4_2023-08-29.md'


2025-11-14 16:19:36,298 - INFO - Going to convert document batch...
2025-11-14 16:19:36,368 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,370 - ERROR - Input document 4_2023-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,373 - INFO - Going to convert document batch...
2025-11-14 16:19:36,425 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,427 - ERROR - Input document 4_2023-10-26 with format None does not matc

Error processing data\edgar_documents\CVX\4_2023-10-23: File format not allowed: data\edgar_documents\CVX\4_2023-10-23
Error processing data\edgar_documents\CVX\4_2023-10-24: File format not allowed: data\edgar_documents\CVX\4_2023-10-24
Error processing data\edgar_documents\CVX\4_2023-10-26: File format not allowed: data\edgar_documents\CVX\4_2023-10-26
Error processing data\edgar_documents\CVX\4_2023-10-27: File format not allowed: data\edgar_documents\CVX\4_2023-10-27


2025-11-14 16:19:36,481 - ERROR - Input document 4_2023-11-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,485 - INFO - Going to convert document batch...
2025-11-14 16:19:36,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:36,548 - INFO - Going to convert document batch...
2025-11-14 16:19:36,550 - INFO - Processing document 4_2023-11-29
2025-11-14 16:19:36,640 - INFO - Finished converting document 4_2023-11-29 in 0.16 sec.


Error processing data\edgar_documents\CVX\4_2023-11-02: File format not allowed: data\edgar_documents\CVX\4_2023-11-02


2025-11-14 16:19:36,875 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,876 - ERROR - Input document 4_2023-12-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,881 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVX\4_2023-11-29' --> 'data\processed_data\CVX\4_2023-11-29.md'
Error processing data\edgar_documents\CVX\4_2023-12-08: File format not allowed: data\edgar_documents\CVX\4_2023-12-08


2025-11-14 16:19:36,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,047 - INFO - Going to convert document batch...
2025-11-14 16:19:37,049 - INFO - Processing document 4_2023-12-20
2025-11-14 16:19:37,213 - INFO - Finished converting document 4_2023-12-20 in 0.34 sec.
2025-11-14 16:19:37,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,406 - INFO - Going to convert document batch...
2025-11-14 16:19:37,408 - INFO - Processing document 4_2024-02-02
2025-11-14 16:19:37,477 - INFO - Finished converting document 4_2024-02-02 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2023-12-20' --> 'data\processed_data\CVX\4_2023-12-20.md'


2025-11-14 16:19:37,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,634 - INFO - Going to convert document batch...
2025-11-14 16:19:37,636 - INFO - Processing document 4_2024-02-08
2025-11-14 16:19:37,730 - INFO - Finished converting document 4_2024-02-08 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2024-02-02' --> 'data\processed_data\CVX\4_2024-02-02.md'


2025-11-14 16:19:37,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,886 - INFO - Going to convert document batch...
2025-11-14 16:19:37,888 - INFO - Processing document 4_2024-03-06
2025-11-14 16:19:38,001 - INFO - Finished converting document 4_2024-03-06 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2024-02-08' --> 'data\processed_data\CVX\4_2024-02-08.md'


2025-11-14 16:19:38,143 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:38,145 - ERROR - Input document 4_2024-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:38,146 - INFO - Going to convert document batch...
2025-11-14 16:19:38,168 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:38,170 - ERROR - Input document 4_2024-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\CVX\4_2024-03-06' --> 'data\processed_data\CVX\4_2024-03-06.md'
Error processing data\edgar_documents\CVX\4_2024-03-22: File format not allowed: data\edgar_documents\CVX\4_2024-03-22
Error processing data\edgar_documents\CVX\4_2024-04-03: File format not allowed: data\edgar_documents\CVX\4_2024-04-03


2025-11-14 16:19:38,333 - INFO - Finished converting document 4_2024-04-04 in 0.16 sec.
2025-11-14 16:19:38,620 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVX\4_2024-04-04' --> 'data\processed_data\CVX\4_2024-04-04.md'


2025-11-14 16:19:38,621 - ERROR - Input document 4_2024-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:38,635 - INFO - Going to convert document batch...
2025-11-14 16:19:38,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:38,706 - INFO - Going to convert document batch...
2025-11-14 16:19:38,708 - INFO - Processing document 4_2024-04-29
2025-11-14 16:19:38,798 - INFO - Finished converting document 4_2024-04-29 in 0.16 sec.


Error processing data\edgar_documents\CVX\4_2024-04-26: File format not allowed: data\edgar_documents\CVX\4_2024-04-26


2025-11-14 16:19:38,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:38,959 - INFO - Going to convert document batch...
2025-11-14 16:19:38,962 - INFO - Processing document 4_2024-05-06
2025-11-14 16:19:39,048 - INFO - Finished converting document 4_2024-05-06 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-04-29' --> 'data\processed_data\CVX\4_2024-04-29.md'


2025-11-14 16:19:39,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,202 - INFO - Going to convert document batch...
2025-11-14 16:19:39,204 - INFO - Processing document 4_2024-05-13
2025-11-14 16:19:39,284 - INFO - Finished converting document 4_2024-05-13 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-06' --> 'data\processed_data\CVX\4_2024-05-06.md'


2025-11-14 16:19:39,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,453 - INFO - Going to convert document batch...
2025-11-14 16:19:39,456 - INFO - Processing document 4_2024-05-23
2025-11-14 16:19:39,552 - INFO - Finished converting document 4_2024-05-23 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-13' --> 'data\processed_data\CVX\4_2024-05-13.md'


2025-11-14 16:19:39,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,691 - INFO - Going to convert document batch...
2025-11-14 16:19:39,693 - INFO - Processing document 4_2024-05-28
2025-11-14 16:19:39,788 - INFO - Finished converting document 4_2024-05-28 in 0.14 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-23' --> 'data\processed_data\CVX\4_2024-05-23.md'


2025-11-14 16:19:39,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,925 - INFO - Going to convert document batch...
2025-11-14 16:19:39,927 - INFO - Processing document 4_2024-05-30
2025-11-14 16:19:40,013 - INFO - Finished converting document 4_2024-05-30 in 0.14 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-28' --> 'data\processed_data\CVX\4_2024-05-28.md'


2025-11-14 16:19:40,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,171 - INFO - Going to convert document batch...
2025-11-14 16:19:40,173 - INFO - Processing document 4_2024-08-08


Converted 'data\edgar_documents\CVX\4_2024-05-30' --> 'data\processed_data\CVX\4_2024-05-30.md'


2025-11-14 16:19:40,514 - INFO - Finished converting document 4_2024-08-08 in 0.42 sec.
2025-11-14 16:19:40,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,654 - INFO - Going to convert document batch...
2025-11-14 16:19:40,655 - INFO - Processing document 4_2024-08-22
2025-11-14 16:19:40,718 - INFO - Finished converting document 4_2024-08-22 in 0.11 sec.


Converted 'data\edgar_documents\CVX\4_2024-08-08' --> 'data\processed_data\CVX\4_2024-08-08.md'
Converted 'data\edgar_documents\CVX\4_2024-08-22' --> 'data\processed_data\CVX\4_2024-08-22.md'


2025-11-14 16:19:40,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,857 - INFO - Going to convert document batch...
2025-11-14 16:19:40,859 - INFO - Processing document 4_2024-09-04
2025-11-14 16:19:40,940 - INFO - Finished converting document 4_2024-09-04 in 0.14 sec.
2025-11-14 16:19:41,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,153 - INFO - Going to convert document batch...
2025-11-14 16:19:41,155 - INFO - Processing document 4_2024-11-18
2025-11-14 16:19:41,233 - INFO - Finished converting document 4_2024-11-18 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-09-04' --> 'data\processed_data\CVX\4_2024-09-04.md'


2025-11-14 16:19:41,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,382 - INFO - Going to convert document batch...
2025-11-14 16:19:41,385 - INFO - Processing document 4_2024-12-04
2025-11-14 16:19:41,470 - INFO - Finished converting document 4_2024-12-04 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-11-18' --> 'data\processed_data\CVX\4_2024-11-18.md'


2025-11-14 16:19:41,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,642 - INFO - Going to convert document batch...
2025-11-14 16:19:41,644 - INFO - Processing document 4_2024-12-19


Converted 'data\edgar_documents\CVX\4_2024-12-04' --> 'data\processed_data\CVX\4_2024-12-04.md'


2025-11-14 16:19:41,812 - INFO - Finished converting document 4_2024-12-19 in 0.27 sec.
2025-11-14 16:19:42,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,133 - INFO - Going to convert document batch...
2025-11-14 16:19:42,135 - INFO - Processing document 4_2025-02-04


Converted 'data\edgar_documents\CVX\4_2024-12-19' --> 'data\processed_data\CVX\4_2024-12-19.md'


2025-11-14 16:19:42,248 - INFO - Finished converting document 4_2025-02-04 in 0.22 sec.
2025-11-14 16:19:42,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,440 - INFO - Going to convert document batch...
2025-11-14 16:19:42,443 - INFO - Processing document 4_2025-02-06
2025-11-14 16:19:42,530 - INFO - Finished converting document 4_2025-02-06 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-02-04' --> 'data\processed_data\CVX\4_2025-02-04.md'


2025-11-14 16:19:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,778 - INFO - Going to convert document batch...
2025-11-14 16:19:42,781 - INFO - Processing document 4_2025-02-11


Converted 'data\edgar_documents\CVX\4_2025-02-06' --> 'data\processed_data\CVX\4_2025-02-06.md'


2025-11-14 16:19:42,905 - INFO - Finished converting document 4_2025-02-11 in 0.30 sec.
2025-11-14 16:19:43,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:43,112 - INFO - Going to convert document batch...
2025-11-14 16:19:43,114 - INFO - Processing document 4_2025-02-12


Converted 'data\edgar_documents\CVX\4_2025-02-11' --> 'data\processed_data\CVX\4_2025-02-11.md'


2025-11-14 16:19:43,228 - INFO - Finished converting document 4_2025-02-12 in 0.22 sec.
2025-11-14 16:19:43,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:43,356 - ERROR - Input document 4_2025-02-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:43,359 - INFO - Going to convert document batch...
2025-11-14 16:19:43,383 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:43,385 - ERROR - Input document 4_2025-02-25 with forma

Converted 'data\edgar_documents\CVX\4_2025-02-12' --> 'data\processed_data\CVX\4_2025-02-12.md'
Error processing data\edgar_documents\CVX\4_2025-02-24: File format not allowed: data\edgar_documents\CVX\4_2025-02-24
Error processing data\edgar_documents\CVX\4_2025-02-25: File format not allowed: data\edgar_documents\CVX\4_2025-02-25


2025-11-14 16:19:43,544 - INFO - Finished converting document 4_2025-02-27 in 0.16 sec.
2025-11-14 16:19:43,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:43,786 - INFO - Going to convert document batch...
2025-11-14 16:19:43,789 - INFO - Processing document 4_2025-03-05
2025-11-14 16:19:43,884 - INFO - Finished converting document 4_2025-03-05 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2025-02-27' --> 'data\processed_data\CVX\4_2025-02-27.md'


2025-11-14 16:19:44,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,061 - INFO - Going to convert document batch...
2025-11-14 16:19:44,063 - INFO - Processing document 4_2025-05-29
2025-11-14 16:19:44,145 - INFO - Finished converting document 4_2025-05-29 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-03-05' --> 'data\processed_data\CVX\4_2025-03-05.md'


2025-11-14 16:19:44,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,282 - INFO - Going to convert document batch...
2025-11-14 16:19:44,284 - INFO - Processing document 4_2025-06-04
2025-11-14 16:19:44,363 - INFO - Finished converting document 4_2025-06-04 in 0.12 sec.


Converted 'data\edgar_documents\CVX\4_2025-05-29' --> 'data\processed_data\CVX\4_2025-05-29.md'


2025-11-14 16:19:44,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,605 - INFO - Going to convert document batch...
2025-11-14 16:19:44,609 - INFO - Processing document 4_2025-07-22


Converted 'data\edgar_documents\CVX\4_2025-06-04' --> 'data\processed_data\CVX\4_2025-06-04.md'


2025-11-14 16:19:44,727 - INFO - Finished converting document 4_2025-07-22 in 0.27 sec.
2025-11-14 16:19:44,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,884 - INFO - Going to convert document batch...
2025-11-14 16:19:44,886 - INFO - Processing document 4_2025-07-30
2025-11-14 16:19:44,991 - INFO - Finished converting document 4_2025-07-30 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-07-22' --> 'data\processed_data\CVX\4_2025-07-22.md'


2025-11-14 16:19:45,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,141 - INFO - Going to convert document batch...
2025-11-14 16:19:45,143 - INFO - Processing document 4_2025-08-08
2025-11-14 16:19:45,212 - INFO - Finished converting document 4_2025-08-08 in 0.11 sec.


Converted 'data\edgar_documents\CVX\4_2025-07-30' --> 'data\processed_data\CVX\4_2025-07-30.md'


2025-11-14 16:19:45,561 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:45,564 - ERROR - Input document 4_2025-08-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:45,569 - INFO - Going to convert document batch...
2025-11-14 16:19:45,596 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVX\4_2025-08-08' --> 'data\processed_data\CVX\4_2025-08-08.md'
Error processing data\edgar_documents\CVX\4_2025-08-11: File format not allowed: data\edgar_documents\CVX\4_2025-08-11


2025-11-14 16:19:45,597 - ERROR - Input document 4_2025-08-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:45,602 - INFO - Going to convert document batch...
2025-11-14 16:19:45,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,673 - INFO - Going to convert document batch...
2025-11-14 16:19:45,675 - INFO - Processing document 4_2025-08-26
2025-11-14 16:19:45,796 - INFO - Finished converting document 4_2025-08-26 in 0.19 sec.


Error processing data\edgar_documents\CVX\4_2025-08-12: File format not allowed: data\edgar_documents\CVX\4_2025-08-12


2025-11-14 16:19:45,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,974 - INFO - Going to convert document batch...
2025-11-14 16:19:45,975 - INFO - Processing document 4_2025-09-03


Converted 'data\edgar_documents\CVX\4_2025-08-26' --> 'data\processed_data\CVX\4_2025-08-26.md'


2025-11-14 16:19:46,162 - INFO - Finished converting document 4_2025-09-03 in 0.23 sec.
2025-11-14 16:19:46,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:46,389 - INFO - Going to convert document batch...
2025-11-14 16:19:46,391 - INFO - Processing document 8-K_2023-01-27
2025-11-14 16:19:46,489 - INFO - Finished converting document 8-K_2023-01-27 in 0.20 sec.


Converted 'data\edgar_documents\CVX\4_2025-09-03' --> 'data\processed_data\CVX\4_2025-09-03.md'


2025-11-14 16:19:46,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:46,633 - INFO - Going to convert document batch...
2025-11-14 16:19:46,635 - INFO - Processing document 8-K_2023-04-28


Converted 'data\edgar_documents\CVX\8-K_2023-01-27' --> 'data\processed_data\CVX\8-K_2023-01-27.md'


2025-11-14 16:19:47,658 - INFO - Finished converting document 8-K_2023-04-28 in 1.12 sec.
2025-11-14 16:19:47,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:47,793 - INFO - Going to convert document batch...
2025-11-14 16:19:47,795 - INFO - Processing document 8-K_2023-05-22
2025-11-14 16:19:47,868 - INFO - Finished converting document 8-K_2023-05-22 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-04-28' --> 'data\processed_data\CVX\8-K_2023-04-28.md'


2025-11-14 16:19:48,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\8-K_2023-05-22' --> 'data\processed_data\CVX\8-K_2023-05-22.md'


2025-11-14 16:19:48,211 - INFO - Going to convert document batch...
2025-11-14 16:19:48,212 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:19:48,427 - INFO - Finished converting document 8-K_2023-06-02 in 0.45 sec.
2025-11-14 16:19:48,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:48,707 - INFO - Going to convert document batch...
2025-11-14 16:19:48,709 - INFO - Processing document 8-K_2023-07-24
2025-11-14 16:19:48,767 - INFO - Finished converting document 8-K_2023-07-24 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-06-02' --> 'data\processed_data\CVX\8-K_2023-06-02.md'


2025-11-14 16:19:48,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:48,883 - INFO - Going to convert document batch...
2025-11-14 16:19:48,884 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:19:48,950 - INFO - Finished converting document 8-K_2023-07-26 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-07-24' --> 'data\processed_data\CVX\8-K_2023-07-24.md'
Converted 'data\edgar_documents\CVX\8-K_2023-07-26' --> 'data\processed_data\CVX\8-K_2023-07-26.md'


2025-11-14 16:19:49,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,070 - INFO - Going to convert document batch...
2025-11-14 16:19:49,072 - INFO - Processing document 8-K_2023-07-28
2025-11-14 16:19:49,151 - INFO - Finished converting document 8-K_2023-07-28 in 0.17 sec.
2025-11-14 16:19:49,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,239 - INFO - Going to convert document batch...
2025-11-14 16:19:49,240 - INFO - Processing document 8-K_2023-08-07
2025-11-14 16:19:49,292 - INFO - Finished converting document 8-K_2023-08-07 in 0.11 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-07-28' --> 'data\processed_data\CVX\8-K_2023-07-28.md'
Converted 'data\edgar_documents\CVX\8-K_2023-08-07' --> 'data\processed_data\CVX\8-K_2023-08-07.md'


2025-11-14 16:19:49,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,426 - INFO - Going to convert document batch...
2025-11-14 16:19:49,427 - INFO - Processing document 8-K_2023-10-23
2025-11-14 16:19:49,539 - INFO - Finished converting document 8-K_2023-10-23 in 0.22 sec.
2025-11-14 16:19:49,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,724 - INFO - Going to convert document batch...
2025-11-14 16:19:49,725 - INFO - Processing document 8-K_2023-10-27
2025-11-14 16:19:49,789 - INFO - Finished converting document 8-K_2023-10-27 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-10-23' --> 'data\processed_data\CVX\8-K_2023-10-23.md'
Converted 'data\edgar_documents\CVX\8-K_2023-10-27' --> 'data\processed_data\CVX\8-K_2023-10-27.md'


2025-11-14 16:19:49,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,931 - INFO - Going to convert document batch...
2025-11-14 16:19:49,934 - INFO - Processing document 8-K_2023-11-24
2025-11-14 16:19:49,996 - INFO - Finished converting document 8-K_2023-11-24 in 0.17 sec.
2025-11-14 16:19:50,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,114 - INFO - Going to convert document batch...
2025-11-14 16:19:50,117 - INFO - Processing document 8-K_2023-12-08
2025-11-14 16:19:50,194 - INFO - Finished converting document 8-K_2023-12-08 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-11-24' --> 'data\processed_data\CVX\8-K_2023-11-24.md'


2025-11-14 16:19:50,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,397 - INFO - Going to convert document batch...
2025-11-14 16:19:50,398 - INFO - Processing document 8-K_2024-01-02
2025-11-14 16:19:50,436 - INFO - Finished converting document 8-K_2024-01-02 in 0.09 sec.
2025-11-14 16:19:50,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,516 - INFO - Going to convert document batch...
2025-11-14 16:19:50,517 - INFO - Processing document 8-K_2024-02-02


Converted 'data\edgar_documents\CVX\8-K_2023-12-08' --> 'data\processed_data\CVX\8-K_2023-12-08.md'
Converted 'data\edgar_documents\CVX\8-K_2024-01-02' --> 'data\processed_data\CVX\8-K_2024-01-02.md'


2025-11-14 16:19:50,595 - INFO - Finished converting document 8-K_2024-02-02 in 0.14 sec.
2025-11-14 16:19:50,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,716 - INFO - Going to convert document batch...
2025-11-14 16:19:50,717 - INFO - Processing document 8-K_2024-04-26
2025-11-14 16:19:50,749 - INFO - Finished converting document 8-K_2024-04-26 in 0.11 sec.
2025-11-14 16:19:50,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,811 - INFO - Going to convert document batch...
2025-11-14 16:19:50,812 - INFO - Processing document 8-K_2024-05-31


Converted 'data\edgar_documents\CVX\8-K_2024-02-02' --> 'data\processed_data\CVX\8-K_2024-02-02.md'
Converted 'data\edgar_documents\CVX\8-K_2024-04-26' --> 'data\processed_data\CVX\8-K_2024-04-26.md'


2025-11-14 16:19:50,867 - INFO - Finished converting document 8-K_2024-05-31 in 0.09 sec.
2025-11-14 16:19:50,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,995 - INFO - Going to convert document batch...
2025-11-14 16:19:50,996 - INFO - Processing document 8-K_2024-07-31
2025-11-14 16:19:51,023 - INFO - Finished converting document 8-K_2024-07-31 in 0.06 sec.
2025-11-14 16:19:51,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,097 - INFO - Going to convert document batch...
2025-11-14 16:19:51,098 - INFO - Processing document 8-K_2024-08-02
2025-11-14 16:19:51,133 - INFO - Finished converting document 8-K_2024-08-02 in 0.08 sec.


Converted 'data\edgar_documents\CVX\8-K_2024-05-31' --> 'data\processed_data\CVX\8-K_2024-05-31.md'
Converted 'data\edgar_documents\CVX\8-K_2024-07-31' --> 'data\processed_data\CVX\8-K_2024-07-31.md'


2025-11-14 16:19:51,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,192 - INFO - Going to convert document batch...
2025-11-14 16:19:51,195 - INFO - Processing document 8-K_2024-09-30
2025-11-14 16:19:51,229 - INFO - Finished converting document 8-K_2024-09-30 in 0.08 sec.
2025-11-14 16:19:51,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,300 - INFO - Going to convert document batch...
2025-11-14 16:19:51,302 - INFO - Processing document 8-K_2024-10-07
2025-11-14 16:19:51,340 - INFO - Finished converting document 8-K_2024-10-07 in 0.09 sec.


Converted 'data\edgar_documents\CVX\8-K_2024-08-02' --> 'data\processed_data\CVX\8-K_2024-08-02.md'
Converted 'data\edgar_documents\CVX\8-K_2024-09-30' --> 'data\processed_data\CVX\8-K_2024-09-30.md'


2025-11-14 16:19:51,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,394 - INFO - Going to convert document batch...
2025-11-14 16:19:51,395 - INFO - Processing document 8-K_2024-11-01
2025-11-14 16:19:51,429 - INFO - Finished converting document 8-K_2024-11-01 in 0.06 sec.
2025-11-14 16:19:51,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,474 - INFO - Going to convert document batch...
2025-11-14 16:19:51,475 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:19:51,511 - INFO - Finished converting document 8-K_2024-12-10 in 0.08 sec.
2025-11-14 16:19:51,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\8-K_2024-10-07' --> 'data\processed_data\CVX\8-K_2024-10-07.md'
Converted 'data\edgar_documents\CVX\8-K_2024-11-01' --> 'data\processed_data\CVX\8-K_2024-11-01.md'
Converted 'data\edgar_documents\CVX\8-K_2024-12-10' --> 'data\processed_data\CVX\8-K_2024-12-10.md'


2025-11-14 16:19:51,566 - INFO - Going to convert document batch...
2025-11-14 16:19:51,567 - INFO - Processing document 8-K_2025-01-31
2025-11-14 16:19:51,614 - INFO - Finished converting document 8-K_2025-01-31 in 0.08 sec.
2025-11-14 16:19:51,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,734 - INFO - Going to convert document batch...
2025-11-14 16:19:51,735 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:19:51,764 - INFO - Finished converting document 8-K_2025-02-26 in 0.11 sec.
2025-11-14 16:19:51,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,814 - INFO - Going to convert document batch...
2025-11-14 16:19:51,815 - INFO - Processing document 8-K_2025-03-17
2025-11-14 16:19:51,839 - INFO - Finished converting document 8-K_2025-03-17 in 0.06 sec.


Converted 'data\edgar_documents\CVX\8-K_2025-01-31' --> 'data\processed_data\CVX\8-K_2025-01-31.md'
Converted 'data\edgar_documents\CVX\8-K_2025-02-26' --> 'data\processed_data\CVX\8-K_2025-02-26.md'


2025-11-14 16:19:51,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,898 - INFO - Going to convert document batch...
2025-11-14 16:19:51,899 - INFO - Processing document 8-K_2025-05-02
2025-11-14 16:19:51,947 - INFO - Finished converting document 8-K_2025-05-02 in 0.09 sec.
2025-11-14 16:19:52,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,034 - INFO - Going to convert document batch...
2025-11-14 16:19:52,035 - INFO - Processing document 8-K_2025-05-30


Converted 'data\edgar_documents\CVX\8-K_2025-03-17' --> 'data\processed_data\CVX\8-K_2025-03-17.md'
Converted 'data\edgar_documents\CVX\8-K_2025-05-02' --> 'data\processed_data\CVX\8-K_2025-05-02.md'


2025-11-14 16:19:52,085 - INFO - Finished converting document 8-K_2025-05-30 in 0.11 sec.
2025-11-14 16:19:52,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,216 - INFO - Going to convert document batch...
2025-11-14 16:19:52,217 - INFO - Processing document 8-K_2025-07-18
2025-11-14 16:19:52,248 - INFO - Finished converting document 8-K_2025-07-18 in 0.11 sec.
2025-11-14 16:19:52,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,317 - INFO - Going to convert document batch...
2025-11-14 16:19:52,318 - INFO - Processing document 8-K_2025-07-29


Converted 'data\edgar_documents\CVX\8-K_2025-05-30' --> 'data\processed_data\CVX\8-K_2025-05-30.md'
Converted 'data\edgar_documents\CVX\8-K_2025-07-18' --> 'data\processed_data\CVX\8-K_2025-07-18.md'


2025-11-14 16:19:52,375 - INFO - Finished converting document 8-K_2025-07-29 in 0.11 sec.
2025-11-14 16:19:52,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,527 - INFO - Going to convert document batch...
2025-11-14 16:19:52,532 - INFO - Processing document 8-K_2025-08-01
2025-11-14 16:19:52,572 - INFO - Finished converting document 8-K_2025-08-01 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2025-07-29' --> 'data\processed_data\CVX\8-K_2025-07-29.md'
Converted 'data\edgar_documents\CVX\8-K_2025-08-01' --> 'data\processed_data\CVX\8-K_2025-08-01.md'


2025-11-14 16:19:52,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,640 - INFO - Going to convert document batch...
2025-11-14 16:19:52,642 - INFO - Processing document 8-K_2025-08-13
2025-11-14 16:19:52,679 - INFO - Finished converting document 8-K_2025-08-13 in 0.09 sec.
2025-11-14 16:19:52,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,732 - INFO - Going to convert document batch...
2025-11-14 16:19:52,732 - INFO - Processing document 8-K_2025-09-25
2025-11-14 16:19:52,763 - INFO - Finished converting document 8-K_2025-09-25 in 0.06 sec.
2025-11-14 16:19:52,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,812 - INFO - Going to convert document batch...
2025-11-14 16:19:52,813 - INFO - Processing document 8-K_2025-10-31
2025-11-14 16:19:52,841 - INFO - Finished converting document 8-K_2025-10-31 in 0.06 sec.
2025-11-14 16:19:52,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\CVX\8-K_2025-08-13' --> 'data\processed_data\CVX\8-K_2025-08-13.md'
Converted 'data\edgar_documents\CVX\8-K_2025-09-25' --> 'data\processed_data\CVX\8-K_2025-09-25.md'
Converted 'data\edgar_documents\CVX\8-K_2025-10-31' --> 'data\processed_data\CVX\8-K_2025-10-31.md'


2025-11-14 16:19:52,889 - INFO - Processing document 8-K_2025-11-03
2025-11-14 16:19:52,915 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 16:19:53,017 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:53,018 - ERROR - Input document DEF-14A_2023-04-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:53,023 - INFO - Going to convert document batch...
2025-11-14 16:19:53,109 - INFO - detected formats:

Converted 'data\edgar_documents\CVX\8-K_2025-11-03' --> 'data\processed_data\CVX\8-K_2025-11-03.md'
Error processing data\edgar_documents\CVX\DEF-14A_2023-04-12: File format not allowed: data\edgar_documents\CVX\DEF-14A_2023-04-12
Error processing data\edgar_documents\CVX\DEF-14A_2024-04-10: File format not allowed: data\edgar_documents\CVX\DEF-14A_2024-04-10


2025-11-14 16:19:53,198 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:53,200 - ERROR - Input document DEF-14A_2025-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:53,204 - INFO - Going to convert document batch...


Error processing data\edgar_documents\CVX\DEF-14A_2025-04-09: File format not allowed: data\edgar_documents\CVX\DEF-14A_2025-04-09
Processed 88 new files. Errors: 18
Found 75 files to process in data\edgar_documents\DE


2025-11-14 16:19:53,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:57,472 - INFO - Going to convert document batch...
2025-11-14 16:19:57,474 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:19:57,475 - INFO - Processing document 10-K_2023-12-15
2025-11-14 16:20:09,155 - INFO - Finished converting document 10-K_2023-12-15 in 15.94 sec.


Converted 'data\edgar_documents\DE\10-K_2023-12-15' --> 'data\processed_data\DE\10-K_2023-12-15.md'


2025-11-14 16:20:11,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:20:15,862 - INFO - Going to convert document batch...
2025-11-14 16:20:15,863 - INFO - Processing document 10-K_2024-12-12
2025-11-14 16:20:28,879 - INFO - Finished converting document 10-K_2024-12-12 in 17.52 sec.
2025-11-14 16:20:30,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-K_2024-12-12' --> 'data\processed_data\DE\10-K_2024-12-12.md'


2025-11-14 16:20:32,851 - INFO - Going to convert document batch...
2025-11-14 16:20:32,852 - INFO - Processing document 10-Q_2023-02-23
2025-11-14 16:20:35,570 - INFO - Finished converting document 10-Q_2023-02-23 in 5.19 sec.
2025-11-14 16:20:36,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-02-23' --> 'data\processed_data\DE\10-Q_2023-02-23.md'


2025-11-14 16:20:40,030 - INFO - Going to convert document batch...
2025-11-14 16:20:40,031 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:20:43,161 - INFO - Finished converting document 10-Q_2023-06-01 in 7.05 sec.
2025-11-14 16:20:44,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-06-01' --> 'data\processed_data\DE\10-Q_2023-06-01.md'


2025-11-14 16:20:47,248 - INFO - Going to convert document batch...
2025-11-14 16:20:47,250 - INFO - Processing document 10-Q_2023-08-31
2025-11-14 16:20:50,657 - INFO - Finished converting document 10-Q_2023-08-31 in 6.75 sec.
2025-11-14 16:20:51,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-08-31' --> 'data\processed_data\DE\10-Q_2023-08-31.md'


2025-11-14 16:20:54,136 - INFO - Going to convert document batch...
2025-11-14 16:20:54,137 - INFO - Processing document 10-Q_2024-02-29
2025-11-14 16:20:56,834 - INFO - Finished converting document 10-Q_2024-02-29 in 5.34 sec.
2025-11-14 16:20:57,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-02-29' --> 'data\processed_data\DE\10-Q_2024-02-29.md'


2025-11-14 16:21:00,567 - INFO - Going to convert document batch...
2025-11-14 16:21:00,568 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 16:21:04,370 - INFO - Finished converting document 10-Q_2024-05-30 in 6.97 sec.
2025-11-14 16:21:05,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-05-30' --> 'data\processed_data\DE\10-Q_2024-05-30.md'


2025-11-14 16:21:08,180 - INFO - Going to convert document batch...
2025-11-14 16:21:08,181 - INFO - Processing document 10-Q_2024-08-29
2025-11-14 16:21:11,398 - INFO - Finished converting document 10-Q_2024-08-29 in 6.31 sec.
2025-11-14 16:21:12,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-08-29' --> 'data\processed_data\DE\10-Q_2024-08-29.md'


2025-11-14 16:21:15,133 - INFO - Going to convert document batch...
2025-11-14 16:21:15,134 - INFO - Processing document 10-Q_2025-02-27
2025-11-14 16:21:17,452 - INFO - Finished converting document 10-Q_2025-02-27 in 4.97 sec.
2025-11-14 16:21:18,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2025-02-27' --> 'data\processed_data\DE\10-Q_2025-02-27.md'


2025-11-14 16:21:21,070 - INFO - Going to convert document batch...
2025-11-14 16:21:21,072 - INFO - Processing document 10-Q_2025-05-29
2025-11-14 16:21:23,846 - INFO - Finished converting document 10-Q_2025-05-29 in 5.72 sec.
2025-11-14 16:21:24,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2025-05-29' --> 'data\processed_data\DE\10-Q_2025-05-29.md'


2025-11-14 16:21:27,693 - INFO - Going to convert document batch...
2025-11-14 16:21:27,694 - INFO - Processing document 10-Q_2025-08-28
2025-11-14 16:21:30,403 - INFO - Finished converting document 10-Q_2025-08-28 in 6.02 sec.
2025-11-14 16:21:31,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,135 - INFO - Going to convert document batch...
2025-11-14 16:21:31,136 - INFO - Processing document 4_2023-03-02
2025-11-14 16:21:31,172 - INFO - Finished converting document 4_2023-03-02 in 0.09 sec.
2025-11-14 16:21:31,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,239 - INFO - Going to convert document batch...
2025-11-14 16:21:31,240 - INFO - Processing document 4_2023-05-30
2025-11-14 16:21:31,278 - INFO - Finished converting document 4_2023-05-30 in 0.08 sec.


Converted 'data\edgar_documents\DE\10-Q_2025-08-28' --> 'data\processed_data\DE\10-Q_2025-08-28.md'
Converted 'data\edgar_documents\DE\4_2023-03-02' --> 'data\processed_data\DE\4_2023-03-02.md'


2025-11-14 16:21:31,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,356 - INFO - Going to convert document batch...
2025-11-14 16:21:31,358 - INFO - Processing document 4_2023-06-05
2025-11-14 16:21:31,406 - INFO - Finished converting document 4_2023-06-05 in 0.09 sec.
2025-11-14 16:21:31,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,474 - INFO - Going to convert document batch...
2025-11-14 16:21:31,475 - INFO - Processing document 4_2023-06-07


Converted 'data\edgar_documents\DE\4_2023-05-30' --> 'data\processed_data\DE\4_2023-05-30.md'
Converted 'data\edgar_documents\DE\4_2023-06-05' --> 'data\processed_data\DE\4_2023-06-05.md'


2025-11-14 16:21:31,515 - INFO - Finished converting document 4_2023-06-07 in 0.08 sec.
2025-11-14 16:21:31,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,629 - INFO - Going to convert document batch...
2025-11-14 16:21:31,630 - INFO - Processing document 4_2023-06-08
2025-11-14 16:21:31,690 - INFO - Finished converting document 4_2023-06-08 in 0.12 sec.


Converted 'data\edgar_documents\DE\4_2023-06-07' --> 'data\processed_data\DE\4_2023-06-07.md'
Converted 'data\edgar_documents\DE\4_2023-06-08' --> 'data\processed_data\DE\4_2023-06-08.md'


2025-11-14 16:21:31,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,834 - INFO - Going to convert document batch...
2025-11-14 16:21:31,837 - INFO - Processing document 4_2023-06-26
2025-11-14 16:21:31,893 - INFO - Finished converting document 4_2023-06-26 in 0.16 sec.
2025-11-14 16:21:31,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:31,982 - INFO - Going to convert document batch...
2025-11-14 16:21:31,983 - INFO - Processing document 4_2023-07-26
2025-11-14 16:21:32,018 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 16:21:32,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,078 - INFO - Going to convert document batch...
2025-11-14 16:21:32,078 - INFO - Processing document 4_2023-08-02
2025-11-14 16:21:32,101 - INFO - Finished converting document 4_2023-08-02 in 0.05 sec.
2025-11-14 16:21:32,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\4_2023-06-26' --> 'data\processed_data\DE\4_2023-06-26.md'
Converted 'data\edgar_documents\DE\4_2023-07-26' --> 'data\processed_data\DE\4_2023-07-26.md'
Converted 'data\edgar_documents\DE\4_2023-08-02' --> 'data\processed_data\DE\4_2023-08-02.md'


2025-11-14 16:21:32,158 - INFO - Going to convert document batch...
2025-11-14 16:21:32,159 - INFO - Processing document 4_2023-08-16
2025-11-14 16:21:32,196 - INFO - Finished converting document 4_2023-08-16 in 0.06 sec.
2025-11-14 16:21:32,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,273 - INFO - Going to convert document batch...
2025-11-14 16:21:32,274 - INFO - Processing document 4_2023-10-03
2025-11-14 16:21:32,307 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 16:21:32,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\4_2023-08-16' --> 'data\processed_data\DE\4_2023-08-16.md'
Converted 'data\edgar_documents\DE\4_2023-10-03' --> 'data\processed_data\DE\4_2023-10-03.md'


2025-11-14 16:21:32,428 - INFO - Going to convert document batch...
2025-11-14 16:21:32,429 - INFO - Processing document 4_2023-12-12
2025-11-14 16:21:32,465 - INFO - Finished converting document 4_2023-12-12 in 0.12 sec.
2025-11-14 16:21:32,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,544 - INFO - Going to convert document batch...
2025-11-14 16:21:32,545 - INFO - Processing document 4_2023-12-13
2025-11-14 16:21:32,567 - INFO - Finished converting document 4_2023-12-13 in 0.06 sec.
2025-11-14 16:21:32,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,627 - INFO - Going to convert document batch...
2025-11-14 16:21:32,628 - INFO - Processing document 4_2023-12-15
2025-11-14 16:21:32,659 - INFO - Finished converting document 4_2023-12-15 in 0.06 sec.


Converted 'data\edgar_documents\DE\4_2023-12-12' --> 'data\processed_data\DE\4_2023-12-12.md'
Converted 'data\edgar_documents\DE\4_2023-12-13' --> 'data\processed_data\DE\4_2023-12-13.md'


2025-11-14 16:21:32,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,716 - INFO - Going to convert document batch...
2025-11-14 16:21:32,717 - INFO - Processing document 4_2024-03-07
2025-11-14 16:21:32,749 - INFO - Finished converting document 4_2024-03-07 in 0.06 sec.
2025-11-14 16:21:32,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,817 - INFO - Going to convert document batch...
2025-11-14 16:21:32,819 - INFO - Processing document 4_2024-05-02
2025-11-14 16:21:32,841 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 16:21:32,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\4_2023-12-15' --> 'data\processed_data\DE\4_2023-12-15.md'
Converted 'data\edgar_documents\DE\4_2024-03-07' --> 'data\processed_data\DE\4_2024-03-07.md'
Converted 'data\edgar_documents\DE\4_2024-05-02' --> 'data\processed_data\DE\4_2024-05-02.md'


2025-11-14 16:21:32,895 - INFO - Going to convert document batch...
2025-11-14 16:21:32,896 - INFO - Processing document 4_2024-06-04
2025-11-14 16:21:32,925 - INFO - Finished converting document 4_2024-06-04 in 0.06 sec.
2025-11-14 16:21:32,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:32,992 - INFO - Going to convert document batch...
2025-11-14 16:21:32,992 - INFO - Processing document 4_2024-06-25
2025-11-14 16:21:33,025 - INFO - Finished converting document 4_2024-06-25 in 0.05 sec.
2025-11-14 16:21:33,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,084 - INFO - Going to convert document batch...
2025-11-14 16:21:33,086 - INFO - Processing document 4_2024-08-16
2025-11-14 16:21:33,117 - INFO - Finished converting document 4_2024-08-16 in 0.06 sec.
2025-11-14 16:21:33,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\4_2024-06-04' --> 'data\processed_data\DE\4_2024-06-04.md'
Converted 'data\edgar_documents\DE\4_2024-06-25' --> 'data\processed_data\DE\4_2024-06-25.md'
Converted 'data\edgar_documents\DE\4_2024-08-16' --> 'data\processed_data\DE\4_2024-08-16.md'


2025-11-14 16:21:33,181 - INFO - Going to convert document batch...
2025-11-14 16:21:33,182 - INFO - Processing document 4_2024-11-01
2025-11-14 16:21:33,273 - INFO - Finished converting document 4_2024-11-01 in 0.11 sec.
2025-11-14 16:21:33,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,374 - INFO - Going to convert document batch...
2025-11-14 16:21:33,374 - INFO - Processing document 4_2024-11-04
2025-11-14 16:21:33,401 - INFO - Finished converting document 4_2024-11-04 in 0.09 sec.
2025-11-14 16:21:33,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,459 - INFO - Going to convert document batch...
2025-11-14 16:21:33,460 - INFO - Processing document 4_2024-12-13
2025-11-14 16:21:33,487 - INFO - Finished converting document 4_2024-12-13 in 0.05 sec.


Converted 'data\edgar_documents\DE\4_2024-11-01' --> 'data\processed_data\DE\4_2024-11-01.md'
Converted 'data\edgar_documents\DE\4_2024-11-04' --> 'data\processed_data\DE\4_2024-11-04.md'


2025-11-14 16:21:33,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,548 - INFO - Going to convert document batch...
2025-11-14 16:21:33,550 - INFO - Processing document 4_2024-12-16
2025-11-14 16:21:33,588 - INFO - Finished converting document 4_2024-12-16 in 0.08 sec.
2025-11-14 16:21:33,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,652 - INFO - Going to convert document batch...
2025-11-14 16:21:33,653 - INFO - Processing document 4_2024-12-17
2025-11-14 16:21:33,680 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.


Converted 'data\edgar_documents\DE\4_2024-12-13' --> 'data\processed_data\DE\4_2024-12-13.md'
Converted 'data\edgar_documents\DE\4_2024-12-16' --> 'data\processed_data\DE\4_2024-12-16.md'


2025-11-14 16:21:33,737 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:21:33,740 - ERROR - Input document 4_2025-01-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:21:33,742 - INFO - Going to convert document batch...
2025-11-14 16:21:33,775 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:21:33,776 - ERROR - Input document 4_2025-01-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\DE\4_2024-12-17' --> 'data\processed_data\DE\4_2024-12-17.md'
Error processing data\edgar_documents\DE\4_2025-01-13: File format not allowed: data\edgar_documents\DE\4_2025-01-13
Error processing data\edgar_documents\DE\4_2025-01-15: File format not allowed: data\edgar_documents\DE\4_2025-01-15
Converted 'data\edgar_documents\DE\4_2025-02-19' --> 'data\processed_data\DE\4_2025-02-19.md'


2025-11-14 16:21:33,908 - INFO - Going to convert document batch...
2025-11-14 16:21:33,908 - INFO - Processing document 4_2025-03-06
2025-11-14 16:21:33,937 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 16:21:33,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:33,988 - INFO - Going to convert document batch...
2025-11-14 16:21:33,988 - INFO - Processing document 4_2025-05-02
2025-11-14 16:21:34,011 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 16:21:34,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,057 - INFO - Going to convert document batch...
2025-11-14 16:21:34,058 - INFO - Processing document 4_2025-06-03
2025-11-14 16:21:34,082 - INFO - Finished converting document 4_2025-06-03 in 0.05 sec.
2025-11-14 16:21:34,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,133 - INFO - Going to convert document batch...
2025-11-14 16:21:34,134 - 

Converted 'data\edgar_documents\DE\4_2025-03-06' --> 'data\processed_data\DE\4_2025-03-06.md'
Converted 'data\edgar_documents\DE\4_2025-05-02' --> 'data\processed_data\DE\4_2025-05-02.md'
Converted 'data\edgar_documents\DE\4_2025-06-03' --> 'data\processed_data\DE\4_2025-06-03.md'


2025-11-14 16:21:34,219 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:21:34,221 - ERROR - Input document 4_2025-10-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:21:34,223 - INFO - Going to convert document batch...
2025-11-14 16:21:34,254 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:21:34,256 - ERROR - Input document 4_2025-10-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\DE\4_2025-08-18' --> 'data\processed_data\DE\4_2025-08-18.md'
Error processing data\edgar_documents\DE\4_2025-10-02: File format not allowed: data\edgar_documents\DE\4_2025-10-02
Error processing data\edgar_documents\DE\4_2025-10-03: File format not allowed: data\edgar_documents\DE\4_2025-10-03
Converted 'data\edgar_documents\DE\4_2025-11-03' --> 'data\processed_data\DE\4_2025-11-03.md'


2025-11-14 16:21:34,426 - INFO - Going to convert document batch...
2025-11-14 16:21:34,428 - INFO - Processing document 8-K_2023-02-17
2025-11-14 16:21:34,462 - INFO - Finished converting document 8-K_2023-02-17 in 0.09 sec.
2025-11-14 16:21:34,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,514 - INFO - Going to convert document batch...
2025-11-14 16:21:34,515 - INFO - Processing document 8-K_2023-02-22
2025-11-14 16:21:34,544 - INFO - Finished converting document 8-K_2023-02-22 in 0.06 sec.
2025-11-14 16:21:34,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,618 - INFO - Going to convert document batch...
2025-11-14 16:21:34,619 - INFO - Processing document 8-K_2023-02-27
2025-11-14 16:21:34,672 - INFO - Finished converting document 8-K_2023-02-27 in 0.11 sec.


Converted 'data\edgar_documents\DE\8-K_2023-02-17' --> 'data\processed_data\DE\8-K_2023-02-17.md'
Converted 'data\edgar_documents\DE\8-K_2023-02-22' --> 'data\processed_data\DE\8-K_2023-02-22.md'


2025-11-14 16:21:34,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,753 - INFO - Going to convert document batch...
2025-11-14 16:21:34,754 - INFO - Processing document 8-K_2023-05-19
2025-11-14 16:21:34,828 - INFO - Finished converting document 8-K_2023-05-19 in 0.14 sec.
2025-11-14 16:21:34,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\8-K_2023-02-27' --> 'data\processed_data\DE\8-K_2023-02-27.md'
Converted 'data\edgar_documents\DE\8-K_2023-05-19' --> 'data\processed_data\DE\8-K_2023-05-19.md'


2025-11-14 16:21:34,894 - INFO - Going to convert document batch...
2025-11-14 16:21:34,896 - INFO - Processing document 8-K_2023-05-31
2025-11-14 16:21:34,929 - INFO - Finished converting document 8-K_2023-05-31 in 0.08 sec.
2025-11-14 16:21:34,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:34,991 - INFO - Going to convert document batch...
2025-11-14 16:21:34,992 - INFO - Processing document 8-K_2023-08-01
2025-11-14 16:21:35,018 - INFO - Finished converting document 8-K_2023-08-01 in 0.06 sec.
2025-11-14 16:21:35,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,063 - INFO - Going to convert document batch...
2025-11-14 16:21:35,063 - INFO - Processing document 8-K_2023-08-18
2025-11-14 16:21:35,083 - INFO - Finished converting document 8-K_2023-08-18 in 0.05 sec.
2025-11-14 16:21:35,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,124 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\DE\8-K_2023-05-31' --> 'data\processed_data\DE\8-K_2023-05-31.md'
Converted 'data\edgar_documents\DE\8-K_2023-08-01' --> 'data\processed_data\DE\8-K_2023-08-01.md'
Converted 'data\edgar_documents\DE\8-K_2023-08-18' --> 'data\processed_data\DE\8-K_2023-08-18.md'


2025-11-14 16:21:35,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,184 - INFO - Going to convert document batch...
2025-11-14 16:21:35,185 - INFO - Processing document 8-K_2023-10-03
2025-11-14 16:21:35,216 - INFO - Finished converting document 8-K_2023-10-03 in 0.06 sec.
2025-11-14 16:21:35,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,317 - INFO - Going to convert document batch...
2025-11-14 16:21:35,319 - INFO - Processing document 8-K_2023-10-30


Converted 'data\edgar_documents\DE\8-K_2023-08-30' --> 'data\processed_data\DE\8-K_2023-08-30.md'
Converted 'data\edgar_documents\DE\8-K_2023-10-03' --> 'data\processed_data\DE\8-K_2023-10-03.md'


2025-11-14 16:21:35,359 - INFO - Finished converting document 8-K_2023-10-30 in 0.12 sec.
2025-11-14 16:21:35,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,443 - INFO - Going to convert document batch...
2025-11-14 16:21:35,444 - INFO - Processing document 8-K_2023-11-22
2025-11-14 16:21:35,471 - INFO - Finished converting document 8-K_2023-11-22 in 0.09 sec.
2025-11-14 16:21:35,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,545 - INFO - Going to convert document batch...
2025-11-14 16:21:35,546 - INFO - Processing document 8-K_2023-12-06


Converted 'data\edgar_documents\DE\8-K_2023-10-30' --> 'data\processed_data\DE\8-K_2023-10-30.md'
Converted 'data\edgar_documents\DE\8-K_2023-11-22' --> 'data\processed_data\DE\8-K_2023-11-22.md'


2025-11-14 16:21:35,578 - INFO - Finished converting document 8-K_2023-12-06 in 0.09 sec.
2025-11-14 16:21:35,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,654 - INFO - Going to convert document batch...
2025-11-14 16:21:35,655 - INFO - Processing document 8-K_2024-02-15
2025-11-14 16:21:35,693 - INFO - Finished converting document 8-K_2024-02-15 in 0.08 sec.
2025-11-14 16:21:35,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\8-K_2023-12-06' --> 'data\processed_data\DE\8-K_2023-12-06.md'
Converted 'data\edgar_documents\DE\8-K_2024-02-15' --> 'data\processed_data\DE\8-K_2024-02-15.md'


2025-11-14 16:21:35,798 - INFO - Going to convert document batch...
2025-11-14 16:21:35,800 - INFO - Processing document 8-K_2024-03-01
2025-11-14 16:21:35,888 - INFO - Finished converting document 8-K_2024-03-01 in 0.17 sec.
2025-11-14 16:21:35,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:35,958 - INFO - Going to convert document batch...
2025-11-14 16:21:35,959 - INFO - Processing document 8-K_2024-05-16
2025-11-14 16:21:35,998 - INFO - Finished converting document 8-K_2024-05-16 in 0.08 sec.
2025-11-14 16:21:36,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,051 - INFO - Going to convert document batch...
2025-11-14 16:21:36,052 - INFO - Processing document 8-K_2024-06-05
2025-11-14 16:21:36,071 - INFO - Finished converting document 8-K_2024-06-05 in 0.05 sec.
2025-11-14 16:21:36,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\8-K_2024-03-01' --> 'data\processed_data\DE\8-K_2024-03-01.md'
Converted 'data\edgar_documents\DE\8-K_2024-05-16' --> 'data\processed_data\DE\8-K_2024-05-16.md'
Converted 'data\edgar_documents\DE\8-K_2024-06-05' --> 'data\processed_data\DE\8-K_2024-06-05.md'


2025-11-14 16:21:36,128 - INFO - Going to convert document batch...
2025-11-14 16:21:36,129 - INFO - Processing document 8-K_2024-08-15
2025-11-14 16:21:36,157 - INFO - Finished converting document 8-K_2024-08-15 in 0.08 sec.
2025-11-14 16:21:36,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,223 - INFO - Going to convert document batch...
2025-11-14 16:21:36,224 - INFO - Processing document 8-K_2024-11-01
2025-11-14 16:21:36,253 - INFO - Finished converting document 8-K_2024-11-01 in 0.08 sec.
2025-11-14 16:21:36,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,300 - INFO - Going to convert document batch...
2025-11-14 16:21:36,301 - INFO - Processing document 8-K_2024-11-21
2025-11-14 16:21:36,321 - INFO - Finished converting document 8-K_2024-11-21 in 0.05 sec.
2025-11-14 16:21:36,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,361 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DE\8-K_2024-08-15' --> 'data\processed_data\DE\8-K_2024-08-15.md'
Converted 'data\edgar_documents\DE\8-K_2024-11-01' --> 'data\processed_data\DE\8-K_2024-11-01.md'
Converted 'data\edgar_documents\DE\8-K_2024-11-21' --> 'data\processed_data\DE\8-K_2024-11-21.md'


2025-11-14 16:21:36,361 - INFO - Processing document 8-K_2024-12-03
2025-11-14 16:21:36,384 - INFO - Finished converting document 8-K_2024-12-03 in 0.05 sec.
2025-11-14 16:21:36,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,493 - INFO - Going to convert document batch...
2025-11-14 16:21:36,494 - INFO - Processing document 8-K_2025-01-16
2025-11-14 16:21:36,528 - INFO - Finished converting document 8-K_2025-01-16 in 0.14 sec.


Converted 'data\edgar_documents\DE\8-K_2024-12-03' --> 'data\processed_data\DE\8-K_2024-12-03.md'
Converted 'data\edgar_documents\DE\8-K_2025-01-16' --> 'data\processed_data\DE\8-K_2025-01-16.md'


2025-11-14 16:21:36,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,620 - INFO - Going to convert document batch...
2025-11-14 16:21:36,621 - INFO - Processing document 8-K_2025-02-13
2025-11-14 16:21:36,657 - INFO - Finished converting document 8-K_2025-02-13 in 0.11 sec.
2025-11-14 16:21:36,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,723 - INFO - Going to convert document batch...
2025-11-14 16:21:36,725 - INFO - Processing document 8-K_2025-02-28
2025-11-14 16:21:36,802 - INFO - Finished converting document 8-K_2025-02-28 in 0.12 sec.


Converted 'data\edgar_documents\DE\8-K_2025-02-13' --> 'data\processed_data\DE\8-K_2025-02-13.md'
Converted 'data\edgar_documents\DE\8-K_2025-02-28' --> 'data\processed_data\DE\8-K_2025-02-28.md'


2025-11-14 16:21:36,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,885 - INFO - Going to convert document batch...
2025-11-14 16:21:36,886 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:21:36,913 - INFO - Finished converting document 8-K_2025-05-15 in 0.08 sec.
2025-11-14 16:21:36,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:36,956 - INFO - Going to convert document batch...
2025-11-14 16:21:36,957 - INFO - Processing document 8-K_2025-07-07
2025-11-14 16:21:36,975 - INFO - Finished converting document 8-K_2025-07-07 in 0.05 sec.
2025-11-14 16:21:37,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:37,018 - INFO - Going to convert document batch...
2025-11-14 16:21:37,020 - INFO - Processing document 8-K_2025-08-14
2025-11-14 16:21:37,051 - INFO - Finished converting document 8-K_2025-08-14 in 0.06 sec.
2025-11-14 16:21:37,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\DE\8-K_2025-05-15' --> 'data\processed_data\DE\8-K_2025-05-15.md'
Converted 'data\edgar_documents\DE\8-K_2025-07-07' --> 'data\processed_data\DE\8-K_2025-07-07.md'
Converted 'data\edgar_documents\DE\8-K_2025-08-14' --> 'data\processed_data\DE\8-K_2025-08-14.md'


2025-11-14 16:21:37,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:37,180 - INFO - Going to convert document batch...
2025-11-14 16:21:37,181 - INFO - Processing document 8-K_2025-10-09
2025-11-14 16:21:37,207 - INFO - Finished converting document 8-K_2025-10-09 in 0.06 sec.


Converted 'data\edgar_documents\DE\8-K_2025-09-02' --> 'data\processed_data\DE\8-K_2025-09-02.md'
Converted 'data\edgar_documents\DE\8-K_2025-10-09' --> 'data\processed_data\DE\8-K_2025-10-09.md'


2025-11-14 16:21:37,417 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:21:37,418 - ERROR - Input document DEF-14A_2023-01-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:21:37,427 - INFO - Going to convert document batch...


Error processing data\edgar_documents\DE\DEF-14A_2023-01-11: File format not allowed: data\edgar_documents\DE\DEF-14A_2023-01-11


2025-11-14 16:21:37,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:40,468 - INFO - Going to convert document batch...
2025-11-14 16:21:40,469 - INFO - Processing document DEF-14A_2024-01-10
2025-11-14 16:21:53,158 - INFO - Finished converting document DEF-14A_2024-01-10 in 15.72 sec.


Converted 'data\edgar_documents\DE\DEF-14A_2024-01-10' --> 'data\processed_data\DE\DEF-14A_2024-01-10.md'


2025-11-14 16:21:55,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:21:58,235 - INFO - Going to convert document batch...
2025-11-14 16:21:58,236 - INFO - Processing document DEF-14A_2025-01-10
2025-11-14 16:22:12,125 - INFO - Finished converting document DEF-14A_2025-01-10 in 17.11 sec.
2025-11-14 16:22:13,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\DEF-14A_2025-01-10' --> 'data\processed_data\DE\DEF-14A_2025-01-10.md'
Processed 70 new files. Errors: 5
Found 112 files to process in data\edgar_documents\DHR


2025-11-14 16:22:15,025 - INFO - Going to convert document batch...
2025-11-14 16:22:15,027 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:22:15,028 - INFO - Processing document 10-K_2023-02-22
2025-11-14 16:22:18,348 - INFO - Finished converting document 10-K_2023-02-22 in 4.67 sec.
2025-11-14 16:22:19,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-K_2023-02-22' --> 'data\processed_data\DHR\10-K_2023-02-22.md'


2025-11-14 16:22:21,315 - INFO - Going to convert document batch...
2025-11-14 16:22:21,315 - INFO - Processing document 10-K_2024-02-21
2025-11-14 16:22:23,733 - INFO - Finished converting document 10-K_2024-02-21 in 4.50 sec.
2025-11-14 16:22:24,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-K_2024-02-21' --> 'data\processed_data\DHR\10-K_2024-02-21.md'


2025-11-14 16:22:25,593 - INFO - Going to convert document batch...
2025-11-14 16:22:25,594 - INFO - Processing document 10-K_2025-02-20
2025-11-14 16:22:28,516 - INFO - Finished converting document 10-K_2025-02-20 in 4.00 sec.
2025-11-14 16:22:29,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-K_2025-02-20' --> 'data\processed_data\DHR\10-K_2025-02-20.md'


2025-11-14 16:22:29,952 - INFO - Going to convert document batch...
2025-11-14 16:22:29,953 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 16:22:30,675 - INFO - Finished converting document 10-Q_2023-04-25 in 1.27 sec.
2025-11-14 16:22:31,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2023-04-25' --> 'data\processed_data\DHR\10-Q_2023-04-25.md'


2025-11-14 16:22:31,778 - INFO - Going to convert document batch...
2025-11-14 16:22:31,780 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 16:22:32,875 - INFO - Finished converting document 10-Q_2023-07-25 in 1.80 sec.
2025-11-14 16:22:33,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2023-07-25' --> 'data\processed_data\DHR\10-Q_2023-07-25.md'


2025-11-14 16:22:34,839 - INFO - Going to convert document batch...
2025-11-14 16:22:34,839 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 16:22:35,997 - INFO - Finished converting document 10-Q_2023-10-24 in 2.50 sec.
2025-11-14 16:22:36,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2023-10-24' --> 'data\processed_data\DHR\10-Q_2023-10-24.md'


2025-11-14 16:22:37,345 - INFO - Going to convert document batch...
2025-11-14 16:22:37,346 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 16:22:38,102 - INFO - Finished converting document 10-Q_2024-04-23 in 1.22 sec.
2025-11-14 16:22:40,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2024-04-23' --> 'data\processed_data\DHR\10-Q_2024-04-23.md'


2025-11-14 16:22:41,812 - INFO - Going to convert document batch...
2025-11-14 16:22:41,814 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 16:22:46,319 - INFO - Finished converting document 10-Q_2024-07-23 in 5.97 sec.
2025-11-14 16:22:48,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2024-07-23' --> 'data\processed_data\DHR\10-Q_2024-07-23.md'


2025-11-14 16:22:51,595 - INFO - Going to convert document batch...
2025-11-14 16:22:51,596 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 16:22:54,386 - INFO - Finished converting document 10-Q_2024-10-22 in 6.34 sec.
2025-11-14 16:22:55,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2024-10-22' --> 'data\processed_data\DHR\10-Q_2024-10-22.md'


2025-11-14 16:22:56,857 - INFO - Going to convert document batch...
2025-11-14 16:22:56,859 - INFO - Processing document 10-Q_2025-04-22
2025-11-14 16:22:59,702 - INFO - Finished converting document 10-Q_2025-04-22 in 4.25 sec.
2025-11-14 16:23:00,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2025-04-22' --> 'data\processed_data\DHR\10-Q_2025-04-22.md'


2025-11-14 16:23:03,438 - INFO - Going to convert document batch...
2025-11-14 16:23:03,440 - INFO - Processing document 10-Q_2025-07-22
2025-11-14 16:23:06,180 - INFO - Finished converting document 10-Q_2025-07-22 in 5.42 sec.
2025-11-14 16:23:07,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\10-Q_2025-07-22' --> 'data\processed_data\DHR\10-Q_2025-07-22.md'


2025-11-14 16:23:09,421 - INFO - Going to convert document batch...
2025-11-14 16:23:09,422 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 16:23:12,690 - INFO - Finished converting document 10-Q_2025-10-21 in 5.12 sec.
2025-11-14 16:23:16,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:16,794 - INFO - Going to convert document batch...
2025-11-14 16:23:16,797 - INFO - Processing document 4_2023-01-03
2025-11-14 16:23:16,869 - INFO - Finished converting document 4_2023-01-03 in 0.12 sec.


Converted 'data\edgar_documents\DHR\10-Q_2025-10-21' --> 'data\processed_data\DHR\10-Q_2025-10-21.md'


2025-11-14 16:23:16,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:17,037 - INFO - Going to convert document batch...
2025-11-14 16:23:17,039 - INFO - Processing document 4_2023-01-26


Converted 'data\edgar_documents\DHR\4_2023-01-03' --> 'data\processed_data\DHR\4_2023-01-03.md'


2025-11-14 16:23:17,160 - INFO - Finished converting document 4_2023-01-26 in 0.20 sec.
2025-11-14 16:23:17,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:17,311 - INFO - Going to convert document batch...
2025-11-14 16:23:17,314 - INFO - Processing document 4_2023-01-30
2025-11-14 16:23:17,401 - INFO - Finished converting document 4_2023-01-30 in 0.16 sec.


Converted 'data\edgar_documents\DHR\4_2023-01-26' --> 'data\processed_data\DHR\4_2023-01-26.md'


2025-11-14 16:23:17,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:17,539 - INFO - Going to convert document batch...
2025-11-14 16:23:17,542 - INFO - Processing document 4_2023-02-02
2025-11-14 16:23:17,640 - INFO - Finished converting document 4_2023-02-02 in 0.17 sec.


Converted 'data\edgar_documents\DHR\4_2023-01-30' --> 'data\processed_data\DHR\4_2023-01-30.md'


2025-11-14 16:23:17,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:17,787 - INFO - Going to convert document batch...
2025-11-14 16:23:17,790 - INFO - Processing document 4_2023-02-03
2025-11-14 16:23:17,885 - INFO - Finished converting document 4_2023-02-03 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2023-02-02' --> 'data\processed_data\DHR\4_2023-02-02.md'


2025-11-14 16:23:18,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:18,104 - INFO - Going to convert document batch...
2025-11-14 16:23:18,106 - INFO - Processing document 4_2023-02-23
2025-11-14 16:23:18,182 - INFO - Finished converting document 4_2023-02-23 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2023-02-03' --> 'data\processed_data\DHR\4_2023-02-03.md'
Converted 'data\edgar_documents\DHR\4_2023-02-23' --> 'data\processed_data\DHR\4_2023-02-23.md'


2025-11-14 16:23:18,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:18,341 - INFO - Going to convert document batch...
2025-11-14 16:23:18,345 - INFO - Processing document 4_2023-02-28
2025-11-14 16:23:18,435 - INFO - Finished converting document 4_2023-02-28 in 0.19 sec.
2025-11-14 16:23:18,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:18,642 - INFO - Going to convert document batch...
2025-11-14 16:23:18,644 - INFO - Processing document 4_2023-04-17


Converted 'data\edgar_documents\DHR\4_2023-02-28' --> 'data\processed_data\DHR\4_2023-02-28.md'


2025-11-14 16:23:18,753 - INFO - Finished converting document 4_2023-04-17 in 0.22 sec.
2025-11-14 16:23:18,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:18,970 - INFO - Going to convert document batch...
2025-11-14 16:23:18,971 - INFO - Processing document 4_2023-04-18
2025-11-14 16:23:19,076 - INFO - Finished converting document 4_2023-04-18 in 0.20 sec.


Converted 'data\edgar_documents\DHR\4_2023-04-17' --> 'data\processed_data\DHR\4_2023-04-17.md'


2025-11-14 16:23:19,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:19,258 - INFO - Going to convert document batch...
2025-11-14 16:23:19,260 - INFO - Processing document 4_2023-05-01
2025-11-14 16:23:19,371 - INFO - Finished converting document 4_2023-05-01 in 0.17 sec.


Converted 'data\edgar_documents\DHR\4_2023-04-18' --> 'data\processed_data\DHR\4_2023-04-18.md'


2025-11-14 16:23:19,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\4_2023-05-01' --> 'data\processed_data\DHR\4_2023-05-01.md'


2025-11-14 16:23:20,198 - INFO - Going to convert document batch...
2025-11-14 16:23:20,200 - INFO - Processing document 4_2023-05-02
2025-11-14 16:23:20,277 - INFO - Finished converting document 4_2023-05-02 in 0.78 sec.
2025-11-14 16:23:20,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:20,477 - INFO - Going to convert document batch...
2025-11-14 16:23:20,481 - INFO - Processing document 4_2023-05-05


Converted 'data\edgar_documents\DHR\4_2023-05-02' --> 'data\processed_data\DHR\4_2023-05-02.md'


2025-11-14 16:23:20,824 - INFO - Finished converting document 4_2023-05-05 in 0.44 sec.
2025-11-14 16:23:20,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:21,027 - INFO - Going to convert document batch...
2025-11-14 16:23:21,028 - INFO - Processing document 4_2023-05-08
2025-11-14 16:23:21,111 - INFO - Finished converting document 4_2023-05-08 in 0.17 sec.


Converted 'data\edgar_documents\DHR\4_2023-05-05' --> 'data\processed_data\DHR\4_2023-05-05.md'


2025-11-14 16:23:21,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:21,259 - INFO - Going to convert document batch...
2025-11-14 16:23:21,261 - INFO - Processing document 4_2023-05-17
2025-11-14 16:23:21,350 - INFO - Finished converting document 4_2023-05-17 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2023-05-08' --> 'data\processed_data\DHR\4_2023-05-08.md'


2025-11-14 16:23:21,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:21,538 - INFO - Going to convert document batch...
2025-11-14 16:23:21,540 - INFO - Processing document 4_2023-06-01
2025-11-14 16:23:21,628 - INFO - Finished converting document 4_2023-06-01 in 0.16 sec.


Converted 'data\edgar_documents\DHR\4_2023-05-17' --> 'data\processed_data\DHR\4_2023-05-17.md'


2025-11-14 16:23:21,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:21,800 - INFO - Going to convert document batch...
2025-11-14 16:23:21,802 - INFO - Processing document 4_2023-07-18
2025-11-14 16:23:21,884 - INFO - Finished converting document 4_2023-07-18 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2023-06-01' --> 'data\processed_data\DHR\4_2023-06-01.md'


2025-11-14 16:23:22,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\4_2023-07-18' --> 'data\processed_data\DHR\4_2023-07-18.md'


2025-11-14 16:23:22,245 - INFO - Going to convert document batch...
2025-11-14 16:23:22,248 - INFO - Processing document 4_2023-07-27
2025-11-14 16:23:22,533 - INFO - Finished converting document 4_2023-07-27 in 0.53 sec.
2025-11-14 16:23:22,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:22,684 - INFO - Going to convert document batch...
2025-11-14 16:23:22,686 - INFO - Processing document 4_2023-08-01
2025-11-14 16:23:22,764 - INFO - Finished converting document 4_2023-08-01 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2023-07-27' --> 'data\processed_data\DHR\4_2023-07-27.md'


2025-11-14 16:23:22,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:22,918 - INFO - Going to convert document batch...
2025-11-14 16:23:22,920 - INFO - Processing document 4_2023-08-22
2025-11-14 16:23:22,984 - INFO - Finished converting document 4_2023-08-22 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2023-08-01' --> 'data\processed_data\DHR\4_2023-08-01.md'


2025-11-14 16:23:23,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:23,122 - INFO - Going to convert document batch...
2025-11-14 16:23:23,124 - INFO - Processing document 4_2023-10-02
2025-11-14 16:23:23,194 - INFO - Finished converting document 4_2023-10-02 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2023-08-22' --> 'data\processed_data\DHR\4_2023-08-22.md'


2025-11-14 16:23:23,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:23,518 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DHR\4_2023-10-02' --> 'data\processed_data\DHR\4_2023-10-02.md'


2025-11-14 16:23:23,522 - INFO - Processing document 4_2023-10-30
2025-11-14 16:23:23,615 - INFO - Finished converting document 4_2023-10-30 in 0.28 sec.
2025-11-14 16:23:23,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:23,778 - INFO - Going to convert document batch...
2025-11-14 16:23:23,780 - INFO - Processing document 4_2024-01-02
2025-11-14 16:23:23,854 - INFO - Finished converting document 4_2024-01-02 in 0.16 sec.


Converted 'data\edgar_documents\DHR\4_2023-10-30' --> 'data\processed_data\DHR\4_2023-10-30.md'


2025-11-14 16:23:23,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:23,978 - INFO - Going to convert document batch...
2025-11-14 16:23:23,980 - INFO - Processing document 4_2024-01-30
2025-11-14 16:23:24,057 - INFO - Finished converting document 4_2024-01-30 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2024-01-02' --> 'data\processed_data\DHR\4_2024-01-02.md'


2025-11-14 16:23:24,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:24,205 - INFO - Going to convert document batch...
2025-11-14 16:23:24,208 - INFO - Processing document 4_2024-02-02
2025-11-14 16:23:24,278 - INFO - Finished converting document 4_2024-02-02 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2024-01-30' --> 'data\processed_data\DHR\4_2024-01-30.md'


2025-11-14 16:23:24,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:24,804 - INFO - Going to convert document batch...
2025-11-14 16:23:24,806 - INFO - Processing document 4_2024-02-05
2025-11-14 16:23:24,880 - INFO - Finished converting document 4_2024-02-05 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2024-02-02' --> 'data\processed_data\DHR\4_2024-02-02.md'


2025-11-14 16:23:25,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:25,042 - INFO - Going to convert document batch...
2025-11-14 16:23:25,044 - INFO - Processing document 4_2024-02-08
2025-11-14 16:23:25,122 - INFO - Finished converting document 4_2024-02-08 in 0.17 sec.


Converted 'data\edgar_documents\DHR\4_2024-02-05' --> 'data\processed_data\DHR\4_2024-02-05.md'


2025-11-14 16:23:25,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\4_2024-02-08' --> 'data\processed_data\DHR\4_2024-02-08.md'


2025-11-14 16:23:25,495 - INFO - Going to convert document batch...
2025-11-14 16:23:25,499 - INFO - Processing document 4_2024-02-14
2025-11-14 16:23:25,585 - INFO - Finished converting document 4_2024-02-14 in 0.39 sec.
2025-11-14 16:23:25,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:25,730 - INFO - Going to convert document batch...
2025-11-14 16:23:25,731 - INFO - Processing document 4_2024-02-16
2025-11-14 16:23:25,786 - INFO - Finished converting document 4_2024-02-16 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2024-02-14' --> 'data\processed_data\DHR\4_2024-02-14.md'
Converted 'data\edgar_documents\DHR\4_2024-02-16' --> 'data\processed_data\DHR\4_2024-02-16.md'


2025-11-14 16:23:25,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:25,955 - INFO - Going to convert document batch...
2025-11-14 16:23:25,977 - INFO - Processing document 4_2024-02-23
2025-11-14 16:23:26,495 - INFO - Finished converting document 4_2024-02-23 in 0.64 sec.
2025-11-14 16:23:26,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:26,686 - INFO - Going to convert document batch...
2025-11-14 16:23:26,688 - INFO - Processing document 4_2024-02-27
2025-11-14 16:23:26,765 - INFO - Finished converting document 4_2024-02-27 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2024-02-23' --> 'data\processed_data\DHR\4_2024-02-23.md'


2025-11-14 16:23:26,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:26,901 - INFO - Going to convert document batch...
2025-11-14 16:23:26,905 - INFO - Processing document 4_2024-03-05
2025-11-14 16:23:26,988 - INFO - Finished converting document 4_2024-03-05 in 0.14 sec.


Converted 'data\edgar_documents\DHR\4_2024-02-27' --> 'data\processed_data\DHR\4_2024-02-27.md'


2025-11-14 16:23:27,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:27,116 - INFO - Going to convert document batch...
2025-11-14 16:23:27,117 - INFO - Processing document 4_2024-04-25
2025-11-14 16:23:27,190 - INFO - Finished converting document 4_2024-04-25 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2024-03-05' --> 'data\processed_data\DHR\4_2024-03-05.md'


2025-11-14 16:23:27,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\4_2024-04-25' --> 'data\processed_data\DHR\4_2024-04-25.md'


2025-11-14 16:23:27,502 - INFO - Going to convert document batch...
2025-11-14 16:23:27,515 - INFO - Processing document 4_2024-04-26
2025-11-14 16:23:27,623 - INFO - Finished converting document 4_2024-04-26 in 0.34 sec.
2025-11-14 16:23:27,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:27,746 - INFO - Going to convert document batch...
2025-11-14 16:23:27,747 - INFO - Processing document 4_2024-04-29
2025-11-14 16:23:27,823 - INFO - Finished converting document 4_2024-04-29 in 0.12 sec.


Converted 'data\edgar_documents\DHR\4_2024-04-26' --> 'data\processed_data\DHR\4_2024-04-26.md'


2025-11-14 16:23:28,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,029 - INFO - Going to convert document batch...
2025-11-14 16:23:28,031 - INFO - Processing document 4_2024-05-03
2025-11-14 16:23:28,065 - INFO - Finished converting document 4_2024-05-03 in 0.11 sec.
2025-11-14 16:23:28,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,145 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DHR\4_2024-04-29' --> 'data\processed_data\DHR\4_2024-04-29.md'
Converted 'data\edgar_documents\DHR\4_2024-05-03' --> 'data\processed_data\DHR\4_2024-05-03.md'


2025-11-14 16:23:28,148 - INFO - Processing document 4_2024-05-13
2025-11-14 16:23:28,220 - INFO - Finished converting document 4_2024-05-13 in 0.12 sec.
2025-11-14 16:23:28,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,336 - INFO - Going to convert document batch...
2025-11-14 16:23:28,337 - INFO - Processing document 4_2024-05-15
2025-11-14 16:23:28,378 - INFO - Finished converting document 4_2024-05-15 in 0.11 sec.
2025-11-14 16:23:28,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,445 - INFO - Going to convert document batch...
2025-11-14 16:23:28,446 - INFO - Processing document 4_2024-05-17


Converted 'data\edgar_documents\DHR\4_2024-05-13' --> 'data\processed_data\DHR\4_2024-05-13.md'
Converted 'data\edgar_documents\DHR\4_2024-05-15' --> 'data\processed_data\DHR\4_2024-05-15.md'


2025-11-14 16:23:28,479 - INFO - Finished converting document 4_2024-05-17 in 0.08 sec.
2025-11-14 16:23:28,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,556 - INFO - Going to convert document batch...
2025-11-14 16:23:28,557 - INFO - Processing document 4_2024-07-16
2025-11-14 16:23:28,593 - INFO - Finished converting document 4_2024-07-16 in 0.08 sec.
2025-11-14 16:23:28,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,662 - INFO - Going to convert document batch...
2025-11-14 16:23:28,664 - INFO - Processing document 4_2024-07-26
2025-11-14 16:23:28,693 - INFO - Finished converting document 4_2024-07-26 in 0.06 sec.


Converted 'data\edgar_documents\DHR\4_2024-05-17' --> 'data\processed_data\DHR\4_2024-05-17.md'
Converted 'data\edgar_documents\DHR\4_2024-07-16' --> 'data\processed_data\DHR\4_2024-07-16.md'
Converted 'data\edgar_documents\DHR\4_2024-07-26' --> 'data\processed_data\DHR\4_2024-07-26.md'


2025-11-14 16:23:28,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,769 - INFO - Going to convert document batch...
2025-11-14 16:23:28,771 - INFO - Processing document 4_2024-07-29
2025-11-14 16:23:28,874 - INFO - Finished converting document 4_2024-07-29 in 0.16 sec.
2025-11-14 16:23:28,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:28,982 - INFO - Going to convert document batch...
2025-11-14 16:23:28,985 - INFO - Processing document 4_2024-08-02
2025-11-14 16:23:29,017 - INFO - Finished converting document 4_2024-08-02 in 0.08 sec.
2025-11-14 16:23:29,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,097 - INFO - Going to convert document batch...
2025-11-14 16:23:29,098 - INFO - Processing document 4_2024-08-27
2025-11-14 16:23:29,122 - INFO - Finished converting document 4_2024-08-27 in 0.08 sec.


Converted 'data\edgar_documents\DHR\4_2024-07-29' --> 'data\processed_data\DHR\4_2024-07-29.md'
Converted 'data\edgar_documents\DHR\4_2024-08-02' --> 'data\processed_data\DHR\4_2024-08-02.md'


2025-11-14 16:23:29,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,189 - INFO - Going to convert document batch...
2025-11-14 16:23:29,190 - INFO - Processing document 4_2024-10-28
2025-11-14 16:23:29,213 - INFO - Finished converting document 4_2024-10-28 in 0.06 sec.
2025-11-14 16:23:29,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,296 - INFO - Going to convert document batch...
2025-11-14 16:23:29,297 - INFO - Processing document 4_2024-11-18
2025-11-14 16:23:29,324 - INFO - Finished converting document 4_2024-11-18 in 0.08 sec.


Converted 'data\edgar_documents\DHR\4_2024-08-27' --> 'data\processed_data\DHR\4_2024-08-27.md'
Converted 'data\edgar_documents\DHR\4_2024-10-28' --> 'data\processed_data\DHR\4_2024-10-28.md'


2025-11-14 16:23:29,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,392 - INFO - Going to convert document batch...
2025-11-14 16:23:29,393 - INFO - Processing document 4_2024-11-22
2025-11-14 16:23:29,425 - INFO - Finished converting document 4_2024-11-22 in 0.08 sec.


Converted 'data\edgar_documents\DHR\4_2024-11-18' --> 'data\processed_data\DHR\4_2024-11-18.md'
Converted 'data\edgar_documents\DHR\4_2024-11-22' --> 'data\processed_data\DHR\4_2024-11-22.md'


2025-11-14 16:23:29,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,581 - INFO - Going to convert document batch...
2025-11-14 16:23:29,583 - INFO - Processing document 4_2024-11-27
2025-11-14 16:23:29,612 - INFO - Finished converting document 4_2024-11-27 in 0.16 sec.
2025-11-14 16:23:29,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,697 - INFO - Going to convert document batch...
2025-11-14 16:23:29,698 - INFO - Processing document 4_2024-12-19
2025-11-14 16:23:29,721 - INFO - Finished converting document 4_2024-12-19 in 0.08 sec.
2025-11-14 16:23:29,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,794 - INFO - Going to convert document batch...
2025-11-14 16:23:29,796 - INFO - Processing document 4_2025-01-31
2025-11-14 16:23:29,822 - INFO - Finished converting document 4_2025-01-31 in 0.06 sec.


Converted 'data\edgar_documents\DHR\4_2024-11-27' --> 'data\processed_data\DHR\4_2024-11-27.md'
Converted 'data\edgar_documents\DHR\4_2024-12-19' --> 'data\processed_data\DHR\4_2024-12-19.md'


2025-11-14 16:23:29,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,887 - INFO - Going to convert document batch...
2025-11-14 16:23:29,888 - INFO - Processing document 4_2025-02-04
2025-11-14 16:23:29,924 - INFO - Finished converting document 4_2025-02-04 in 0.08 sec.
2025-11-14 16:23:29,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:29,999 - INFO - Going to convert document batch...
2025-11-14 16:23:30,000 - INFO - Processing document 4_2025-02-10


Converted 'data\edgar_documents\DHR\4_2025-01-31' --> 'data\processed_data\DHR\4_2025-01-31.md'
Converted 'data\edgar_documents\DHR\4_2025-02-04' --> 'data\processed_data\DHR\4_2025-02-04.md'


2025-11-14 16:23:30,030 - INFO - Finished converting document 4_2025-02-10 in 0.08 sec.
2025-11-14 16:23:30,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,092 - INFO - Going to convert document batch...
2025-11-14 16:23:30,092 - INFO - Processing document 4_2025-02-25
2025-11-14 16:23:30,121 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 16:23:30,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,207 - INFO - Going to convert document batch...
2025-11-14 16:23:30,208 - INFO - Processing document 4_2025-03-04
2025-11-14 16:23:30,228 - INFO - Finished converting document 4_2025-03-04 in 0.08 sec.


Converted 'data\edgar_documents\DHR\4_2025-02-10' --> 'data\processed_data\DHR\4_2025-02-10.md'
Converted 'data\edgar_documents\DHR\4_2025-02-25' --> 'data\processed_data\DHR\4_2025-02-25.md'


2025-11-14 16:23:30,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,293 - INFO - Going to convert document batch...
2025-11-14 16:23:30,294 - INFO - Processing document 4_2025-03-05
2025-11-14 16:23:30,335 - INFO - Finished converting document 4_2025-03-05 in 0.08 sec.
2025-11-14 16:23:30,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,417 - INFO - Going to convert document batch...
2025-11-14 16:23:30,418 - INFO - Processing document 4_2025-04-29


Converted 'data\edgar_documents\DHR\4_2025-03-04' --> 'data\processed_data\DHR\4_2025-03-04.md'
Converted 'data\edgar_documents\DHR\4_2025-03-05' --> 'data\processed_data\DHR\4_2025-03-05.md'


2025-11-14 16:23:30,438 - INFO - Finished converting document 4_2025-04-29 in 0.08 sec.
2025-11-14 16:23:30,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,507 - INFO - Going to convert document batch...
2025-11-14 16:23:30,508 - INFO - Processing document 4_2025-05-01
2025-11-14 16:23:30,539 - INFO - Finished converting document 4_2025-05-01 in 0.06 sec.
2025-11-14 16:23:30,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,585 - INFO - Going to convert document batch...
2025-11-14 16:23:30,586 - INFO - Processing document 4_2025-05-14
2025-11-14 16:23:30,615 - INFO - Finished converting document 4_2025-05-14 in 0.05 sec.


Converted 'data\edgar_documents\DHR\4_2025-04-29' --> 'data\processed_data\DHR\4_2025-04-29.md'
Converted 'data\edgar_documents\DHR\4_2025-05-01' --> 'data\processed_data\DHR\4_2025-05-01.md'
Converted 'data\edgar_documents\DHR\4_2025-05-14' --> 'data\processed_data\DHR\4_2025-05-14.md'


2025-11-14 16:23:30,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,681 - INFO - Going to convert document batch...
2025-11-14 16:23:30,683 - INFO - Processing document 4_2025-05-15
2025-11-14 16:23:30,791 - INFO - Finished converting document 4_2025-05-15 in 0.14 sec.
2025-11-14 16:23:30,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,891 - INFO - Going to convert document batch...
2025-11-14 16:23:30,892 - INFO - Processing document 4_2025-05-19
2025-11-14 16:23:30,915 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 16:23:30,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:30,982 - INFO - Going to convert document batch...
2025-11-14 16:23:30,984 - INFO - Processing document 4_2025-07-07
2025-11-14 16:23:31,009 - INFO - Finished converting document 4_2025-07-07 in 0.05 sec.


Converted 'data\edgar_documents\DHR\4_2025-05-15' --> 'data\processed_data\DHR\4_2025-05-15.md'
Converted 'data\edgar_documents\DHR\4_2025-05-19' --> 'data\processed_data\DHR\4_2025-05-19.md'
Converted 'data\edgar_documents\DHR\4_2025-07-07' --> 'data\processed_data\DHR\4_2025-07-07.md'


2025-11-14 16:23:31,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:31,083 - INFO - Going to convert document batch...
2025-11-14 16:23:31,085 - INFO - Processing document 4_2025-07-16
2025-11-14 16:23:31,131 - INFO - Finished converting document 4_2025-07-16 in 0.09 sec.
2025-11-14 16:23:31,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:31,216 - INFO - Going to convert document batch...
2025-11-14 16:23:31,217 - INFO - Processing document 4_2025-07-28
2025-11-14 16:23:31,235 - INFO - Finished converting document 4_2025-07-28 in 0.08 sec.
2025-11-14 16:23:31,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:31,319 - INFO - Going to convert document batch...
2025-11-14 16:23:31,319 - INFO - Processing document 4_2025-08-25
2025-11-14 16:23:31,342 - INFO - Finished converting document 4_2025-08-25 in 0.09 sec.


Converted 'data\edgar_documents\DHR\4_2025-07-16' --> 'data\processed_data\DHR\4_2025-07-16.md'
Converted 'data\edgar_documents\DHR\4_2025-07-28' --> 'data\processed_data\DHR\4_2025-07-28.md'


2025-11-14 16:23:31,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:31,416 - INFO - Going to convert document batch...
2025-11-14 16:23:31,417 - INFO - Processing document 4_2025-11-03
2025-11-14 16:23:31,438 - INFO - Finished converting document 4_2025-11-03 in 0.08 sec.
2025-11-14 16:23:31,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:31,489 - INFO - Going to convert document batch...
2025-11-14 16:23:31,490 - INFO - Processing document 4_2025-11-04


Converted 'data\edgar_documents\DHR\4_2025-08-25' --> 'data\processed_data\DHR\4_2025-08-25.md'
Converted 'data\edgar_documents\DHR\4_2025-11-03' --> 'data\processed_data\DHR\4_2025-11-03.md'


2025-11-14 16:23:31,845 - INFO - Finished converting document 4_2025-11-04 in 0.39 sec.
2025-11-14 16:23:32,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,020 - INFO - Going to convert document batch...
2025-11-14 16:23:32,021 - INFO - Processing document 8-K_2023-01-09
2025-11-14 16:23:32,043 - INFO - Finished converting document 8-K_2023-01-09 in 0.06 sec.
2025-11-14 16:23:32,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,120 - INFO - Going to convert document batch...
2025-11-14 16:23:32,121 - INFO - Processing document 8-K_2023-01-18


Converted 'data\edgar_documents\DHR\4_2025-11-04' --> 'data\processed_data\DHR\4_2025-11-04.md'
Converted 'data\edgar_documents\DHR\8-K_2023-01-09' --> 'data\processed_data\DHR\8-K_2023-01-09.md'


2025-11-14 16:23:32,157 - INFO - Finished converting document 8-K_2023-01-18 in 0.09 sec.
2025-11-14 16:23:32,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,224 - INFO - Going to convert document batch...
2025-11-14 16:23:32,225 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:23:32,248 - INFO - Finished converting document 8-K_2023-01-24 in 0.08 sec.
2025-11-14 16:23:32,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,301 - INFO - Going to convert document batch...
2025-11-14 16:23:32,302 - INFO - Processing document 8-K_2023-04-25
2025-11-14 16:23:32,331 - INFO - Finished converting document 8-K_2023-04-25 in 0.06 sec.
2025-11-14 16:23:32,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\8-K_2023-01-18' --> 'data\processed_data\DHR\8-K_2023-01-18.md'
Converted 'data\edgar_documents\DHR\8-K_2023-01-24' --> 'data\processed_data\DHR\8-K_2023-01-24.md'
Converted 'data\edgar_documents\DHR\8-K_2023-04-25' --> 'data\processed_data\DHR\8-K_2023-04-25.md'


2025-11-14 16:23:32,395 - INFO - Going to convert document batch...
2025-11-14 16:23:32,396 - INFO - Processing document 8-K_2023-05-11
2025-11-14 16:23:32,442 - INFO - Finished converting document 8-K_2023-05-11 in 0.09 sec.
2025-11-14 16:23:32,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,556 - INFO - Going to convert document batch...
2025-11-14 16:23:32,557 - INFO - Processing document 8-K_2023-07-25
2025-11-14 16:23:32,599 - INFO - Finished converting document 8-K_2023-07-25 in 0.12 sec.


Converted 'data\edgar_documents\DHR\8-K_2023-05-11' --> 'data\processed_data\DHR\8-K_2023-05-11.md'
Converted 'data\edgar_documents\DHR\8-K_2023-07-25' --> 'data\processed_data\DHR\8-K_2023-07-25.md'


2025-11-14 16:23:32,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,809 - INFO - Going to convert document batch...
2025-11-14 16:23:32,810 - INFO - Processing document 8-K_2023-08-15
2025-11-14 16:23:32,864 - INFO - Finished converting document 8-K_2023-08-15 in 0.25 sec.
2025-11-14 16:23:32,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:32,914 - INFO - Going to convert document batch...
2025-11-14 16:23:32,914 - INFO - Processing document 8-K_2023-08-31
2025-11-14 16:23:32,940 - INFO - Finished converting document 8-K_2023-08-31 in 0.06 sec.
2025-11-14 16:23:33,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,038 - INFO - Going to convert document batch...
2025-11-14 16:23:33,039 - INFO - Processing document 8-K_2023-09-12
2025-11-14 16:23:33,070 - INFO - Finished converting document 8-K_2023-09-12 in 0.11 sec.


Converted 'data\edgar_documents\DHR\8-K_2023-08-15' --> 'data\processed_data\DHR\8-K_2023-08-15.md'
Converted 'data\edgar_documents\DHR\8-K_2023-08-31' --> 'data\processed_data\DHR\8-K_2023-08-31.md'


2025-11-14 16:23:33,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,179 - INFO - Going to convert document batch...
2025-11-14 16:23:33,180 - INFO - Processing document 8-K_2023-09-19
2025-11-14 16:23:33,239 - INFO - Finished converting document 8-K_2023-09-19 in 0.16 sec.


Converted 'data\edgar_documents\DHR\8-K_2023-09-12' --> 'data\processed_data\DHR\8-K_2023-09-12.md'


2025-11-14 16:23:33,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,351 - INFO - Going to convert document batch...
2025-11-14 16:23:33,352 - INFO - Processing document 8-K_2023-10-02
2025-11-14 16:23:33,424 - INFO - Finished converting document 8-K_2023-10-02 in 0.16 sec.


Converted 'data\edgar_documents\DHR\8-K_2023-09-19' --> 'data\processed_data\DHR\8-K_2023-09-19.md'


2025-11-14 16:23:33,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,536 - INFO - Going to convert document batch...
2025-11-14 16:23:33,537 - INFO - Processing document 8-K_2023-10-24
2025-11-14 16:23:33,582 - INFO - Finished converting document 8-K_2023-10-24 in 0.12 sec.
2025-11-14 16:23:33,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,651 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DHR\8-K_2023-10-02' --> 'data\processed_data\DHR\8-K_2023-10-02.md'
Converted 'data\edgar_documents\DHR\8-K_2023-10-24' --> 'data\processed_data\DHR\8-K_2023-10-24.md'


2025-11-14 16:23:33,653 - INFO - Processing document 8-K_2024-01-08
2025-11-14 16:23:33,688 - INFO - Finished converting document 8-K_2024-01-08 in 0.08 sec.
2025-11-14 16:23:33,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,759 - INFO - Going to convert document batch...
2025-11-14 16:23:33,760 - INFO - Processing document 8-K_2024-01-30
2025-11-14 16:23:33,792 - INFO - Finished converting document 8-K_2024-01-30 in 0.08 sec.
2025-11-14 16:23:33,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,871 - INFO - Going to convert document batch...
2025-11-14 16:23:33,873 - INFO - Processing document 8-K_2024-02-14
2025-11-14 16:23:33,913 - INFO - Finished converting document 8-K_2024-02-14 in 0.09 sec.


Converted 'data\edgar_documents\DHR\8-K_2024-01-08' --> 'data\processed_data\DHR\8-K_2024-01-08.md'
Converted 'data\edgar_documents\DHR\8-K_2024-01-30' --> 'data\processed_data\DHR\8-K_2024-01-30.md'


2025-11-14 16:23:33,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:33,968 - INFO - Going to convert document batch...
2025-11-14 16:23:33,968 - INFO - Processing document 8-K_2024-04-23
2025-11-14 16:23:34,003 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 16:23:34,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:34,075 - INFO - Going to convert document batch...
2025-11-14 16:23:34,076 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:23:34,123 - INFO - Finished converting document 8-K_2024-05-09 in 0.11 sec.


Converted 'data\edgar_documents\DHR\8-K_2024-02-14' --> 'data\processed_data\DHR\8-K_2024-02-14.md'
Converted 'data\edgar_documents\DHR\8-K_2024-04-23' --> 'data\processed_data\DHR\8-K_2024-04-23.md'


2025-11-14 16:23:34,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:34,240 - INFO - Going to convert document batch...
2025-11-14 16:23:34,247 - INFO - Processing document 8-K_2024-06-20


Converted 'data\edgar_documents\DHR\8-K_2024-05-09' --> 'data\processed_data\DHR\8-K_2024-05-09.md'


2025-11-14 16:23:34,365 - INFO - Finished converting document 8-K_2024-06-20 in 0.22 sec.
2025-11-14 16:23:34,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:34,501 - INFO - Going to convert document batch...
2025-11-14 16:23:34,549 - INFO - Processing document 8-K_2024-07-23


Converted 'data\edgar_documents\DHR\8-K_2024-06-20' --> 'data\processed_data\DHR\8-K_2024-06-20.md'


2025-11-14 16:23:34,764 - INFO - Finished converting document 8-K_2024-07-23 in 0.34 sec.
2025-11-14 16:23:34,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:34,925 - INFO - Going to convert document batch...
2025-11-14 16:23:34,927 - INFO - Processing document 8-K_2024-10-22
2025-11-14 16:23:35,002 - INFO - Finished converting document 8-K_2024-10-22 in 0.19 sec.


Converted 'data\edgar_documents\DHR\8-K_2024-07-23' --> 'data\processed_data\DHR\8-K_2024-07-23.md'


2025-11-14 16:23:35,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:35,135 - INFO - Going to convert document batch...
2025-11-14 16:23:35,138 - INFO - Processing document 8-K_2024-12-11
2025-11-14 16:23:35,206 - INFO - Finished converting document 8-K_2024-12-11 in 0.16 sec.


Converted 'data\edgar_documents\DHR\8-K_2024-10-22' --> 'data\processed_data\DHR\8-K_2024-10-22.md'


2025-11-14 16:23:35,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:35,310 - INFO - Going to convert document batch...
2025-11-14 16:23:35,311 - INFO - Processing document 8-K_2025-01-13
2025-11-14 16:23:35,386 - INFO - Finished converting document 8-K_2025-01-13 in 0.14 sec.


Converted 'data\edgar_documents\DHR\8-K_2024-12-11' --> 'data\processed_data\DHR\8-K_2024-12-11.md'
Converted 'data\edgar_documents\DHR\8-K_2025-01-13' --> 'data\processed_data\DHR\8-K_2025-01-13.md'


2025-11-14 16:23:35,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:35,532 - INFO - Going to convert document batch...
2025-11-14 16:23:35,533 - INFO - Processing document 8-K_2025-01-29
2025-11-14 16:23:35,599 - INFO - Finished converting document 8-K_2025-01-29 in 0.17 sec.
2025-11-14 16:23:35,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:35,701 - INFO - Going to convert document batch...
2025-11-14 16:23:35,701 - INFO - Processing document 8-K_2025-02-20
2025-11-14 16:23:35,762 - INFO - Finished converting document 8-K_2025-02-20 in 0.12 sec.


Converted 'data\edgar_documents\DHR\8-K_2025-01-29' --> 'data\processed_data\DHR\8-K_2025-01-29.md'
Converted 'data\edgar_documents\DHR\8-K_2025-02-20' --> 'data\processed_data\DHR\8-K_2025-02-20.md'


2025-11-14 16:23:35,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:35,901 - INFO - Going to convert document batch...
2025-11-14 16:23:35,903 - INFO - Processing document 8-K_2025-04-22
2025-11-14 16:23:35,972 - INFO - Finished converting document 8-K_2025-04-22 in 0.17 sec.
2025-11-14 16:23:36,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:36,132 - INFO - Going to convert document batch...
2025-11-14 16:23:36,134 - INFO - Processing document 8-K_2025-05-08


Converted 'data\edgar_documents\DHR\8-K_2025-04-22' --> 'data\processed_data\DHR\8-K_2025-04-22.md'


2025-11-14 16:23:36,255 - INFO - Finished converting document 8-K_2025-05-08 in 0.23 sec.
2025-11-14 16:23:36,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:36,439 - INFO - Going to convert document batch...
2025-11-14 16:23:36,440 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:23:36,515 - INFO - Finished converting document 8-K_2025-07-22 in 0.17 sec.


Converted 'data\edgar_documents\DHR\8-K_2025-05-08' --> 'data\processed_data\DHR\8-K_2025-05-08.md'


2025-11-14 16:23:36,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:36,694 - INFO - Going to convert document batch...
2025-11-14 16:23:36,695 - INFO - Processing document 8-K_2025-07-24


Converted 'data\edgar_documents\DHR\8-K_2025-07-22' --> 'data\processed_data\DHR\8-K_2025-07-22.md'


2025-11-14 16:23:36,825 - INFO - Finished converting document 8-K_2025-07-24 in 0.28 sec.
2025-11-14 16:23:36,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:36,995 - INFO - Going to convert document batch...
2025-11-14 16:23:36,996 - INFO - Processing document 8-K_2025-07-31
2025-11-14 16:23:37,072 - INFO - Finished converting document 8-K_2025-07-31 in 0.14 sec.


Converted 'data\edgar_documents\DHR\8-K_2025-07-24' --> 'data\processed_data\DHR\8-K_2025-07-24.md'


2025-11-14 16:23:37,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:37,221 - INFO - Going to convert document batch...
2025-11-14 16:23:37,222 - INFO - Processing document 8-K_2025-09-10


Converted 'data\edgar_documents\DHR\8-K_2025-07-31' --> 'data\processed_data\DHR\8-K_2025-07-31.md'


2025-11-14 16:23:37,336 - INFO - Finished converting document 8-K_2025-09-10 in 0.22 sec.
2025-11-14 16:23:37,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:37,484 - INFO - Going to convert document batch...
2025-11-14 16:23:37,487 - INFO - Processing document 8-K_2025-10-21
2025-11-14 16:23:37,564 - INFO - Finished converting document 8-K_2025-10-21 in 0.16 sec.


Converted 'data\edgar_documents\DHR\8-K_2025-09-10' --> 'data\processed_data\DHR\8-K_2025-09-10.md'


2025-11-14 16:23:37,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:23:37,701 - INFO - Going to convert document batch...
2025-11-14 16:23:37,704 - INFO - Processing document 8-K_2025-11-06


Converted 'data\edgar_documents\DHR\8-K_2025-10-21' --> 'data\processed_data\DHR\8-K_2025-10-21.md'


2025-11-14 16:23:38,031 - INFO - Finished converting document 8-K_2025-11-06 in 0.42 sec.
2025-11-14 16:23:38,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\8-K_2025-11-06' --> 'data\processed_data\DHR\8-K_2025-11-06.md'


2025-11-14 16:23:40,573 - INFO - Going to convert document batch...
2025-11-14 16:23:40,575 - INFO - Processing document DEF-14A_2023-03-29
2025-11-14 16:23:46,038 - INFO - Finished converting document DEF-14A_2023-03-29 in 7.94 sec.
2025-11-14 16:23:50,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\DEF-14A_2023-03-29' --> 'data\processed_data\DHR\DEF-14A_2023-03-29.md'


2025-11-14 16:23:52,913 - INFO - Going to convert document batch...
2025-11-14 16:23:52,916 - INFO - Processing document DEF-14A_2024-03-27
2025-11-14 16:23:58,639 - INFO - Finished converting document DEF-14A_2024-03-27 in 8.11 sec.
2025-11-14 16:24:02,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DHR\DEF-14A_2024-03-27' --> 'data\processed_data\DHR\DEF-14A_2024-03-27.md'


2025-11-14 16:24:04,607 - INFO - Going to convert document batch...
2025-11-14 16:24:04,608 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 16:24:13,405 - INFO - Finished converting document DEF-14A_2025-03-26 in 11.09 sec.
2025-11-14 16:24:17,454 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:24:17,456 - ERROR - Input document 10-K_2023-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:24:17,466 - INFO - Going to co

Converted 'data\edgar_documents\DHR\DEF-14A_2025-03-26' --> 'data\processed_data\DHR\DEF-14A_2025-03-26.md'
Processed 112 new files. Errors: 0
Found 121 files to process in data\edgar_documents\DIS
Error processing data\edgar_documents\DIS\10-K_2023-01-24: File format not allowed: data\edgar_documents\DIS\10-K_2023-01-24


2025-11-14 16:24:17,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:24:22,157 - INFO - Going to convert document batch...
2025-11-14 16:24:22,159 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:24:22,161 - INFO - Processing document 10-K_2023-11-21
2025-11-14 16:24:32,258 - INFO - Finished converting document 10-K_2023-11-21 in 14.78 sec.
2025-11-14 16:24:35,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-K_2023-11-21' --> 'data\processed_data\DIS\10-K_2023-11-21.md'


2025-11-14 16:24:37,024 - INFO - Going to convert document batch...
2025-11-14 16:24:37,026 - INFO - Processing document 10-K_2024-01-24
2025-11-14 16:24:40,444 - INFO - Finished converting document 10-K_2024-01-24 in 4.69 sec.
2025-11-14 16:24:42,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-K_2024-01-24' --> 'data\processed_data\DIS\10-K_2024-01-24.md'


2025-11-14 16:24:46,312 - INFO - Going to convert document batch...
2025-11-14 16:24:46,314 - INFO - Processing document 10-K_2024-11-14
2025-11-14 16:24:56,039 - INFO - Finished converting document 10-K_2024-11-14 in 13.38 sec.
2025-11-14 16:24:59,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-K_2024-11-14' --> 'data\processed_data\DIS\10-K_2024-11-14.md'


2025-11-14 16:25:01,636 - INFO - Going to convert document batch...
2025-11-14 16:25:01,639 - INFO - Processing document 10-Q_2023-02-08
2025-11-14 16:25:05,415 - INFO - Finished converting document 10-Q_2023-02-08 in 5.75 sec.
2025-11-14 16:25:07,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2023-02-08' --> 'data\processed_data\DIS\10-Q_2023-02-08.md'


2025-11-14 16:25:09,969 - INFO - Going to convert document batch...
2025-11-14 16:25:09,971 - INFO - Processing document 10-Q_2023-05-10
2025-11-14 16:25:15,917 - INFO - Finished converting document 10-Q_2023-05-10 in 8.70 sec.
2025-11-14 16:25:18,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2023-05-10' --> 'data\processed_data\DIS\10-Q_2023-05-10.md'


2025-11-14 16:25:22,149 - INFO - Going to convert document batch...
2025-11-14 16:25:22,151 - INFO - Processing document 10-Q_2023-08-09
2025-11-14 16:25:27,655 - INFO - Finished converting document 10-Q_2023-08-09 in 9.03 sec.
2025-11-14 16:25:30,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2023-08-09' --> 'data\processed_data\DIS\10-Q_2023-08-09.md'


2025-11-14 16:25:33,298 - INFO - Going to convert document batch...
2025-11-14 16:25:33,300 - INFO - Processing document 10-Q_2024-02-07
2025-11-14 16:25:36,811 - INFO - Finished converting document 10-Q_2024-02-07 in 6.11 sec.
2025-11-14 16:25:37,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2024-02-07' --> 'data\processed_data\DIS\10-Q_2024-02-07.md'


2025-11-14 16:25:41,162 - INFO - Going to convert document batch...
2025-11-14 16:25:41,163 - INFO - Processing document 10-Q_2024-05-07
2025-11-14 16:25:46,826 - INFO - Finished converting document 10-Q_2024-05-07 in 9.20 sec.
2025-11-14 16:25:49,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2024-05-07' --> 'data\processed_data\DIS\10-Q_2024-05-07.md'


2025-11-14 16:25:54,295 - INFO - Going to convert document batch...
2025-11-14 16:25:54,298 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:26:02,672 - INFO - Finished converting document 10-Q_2024-08-07 in 12.97 sec.
2025-11-14 16:26:06,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2024-08-07' --> 'data\processed_data\DIS\10-Q_2024-08-07.md'


2025-11-14 16:26:08,882 - INFO - Going to convert document batch...
2025-11-14 16:26:08,884 - INFO - Processing document 10-Q_2025-02-05
2025-11-14 16:26:13,397 - INFO - Finished converting document 10-Q_2025-02-05 in 7.16 sec.
2025-11-14 16:26:15,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2025-02-05' --> 'data\processed_data\DIS\10-Q_2025-02-05.md'


2025-11-14 16:26:19,352 - INFO - Going to convert document batch...
2025-11-14 16:26:19,353 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 16:26:26,680 - INFO - Finished converting document 10-Q_2025-05-07 in 11.03 sec.
2025-11-14 16:26:29,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\10-Q_2025-05-07' --> 'data\processed_data\DIS\10-Q_2025-05-07.md'


2025-11-14 16:26:32,461 - INFO - Going to convert document batch...
2025-11-14 16:26:32,464 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 16:26:38,509 - INFO - Finished converting document 10-Q_2025-08-06 in 9.22 sec.
2025-11-14 16:26:41,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:41,511 - INFO - Going to convert document batch...
2025-11-14 16:26:41,513 - INFO - Processing document 4_2023-01-04
2025-11-14 16:26:41,587 - INFO - Finished converting document 4_2023-01-04 in 0.19 sec.


Converted 'data\edgar_documents\DIS\10-Q_2025-08-06' --> 'data\processed_data\DIS\10-Q_2025-08-06.md'


2025-11-14 16:26:41,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:41,740 - INFO - Going to convert document batch...
2025-11-14 16:26:41,741 - INFO - Processing document 4_2023-01-13
2025-11-14 16:26:41,829 - INFO - Finished converting document 4_2023-01-13 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-01-04' --> 'data\processed_data\DIS\4_2023-01-04.md'


2025-11-14 16:26:41,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:41,995 - INFO - Going to convert document batch...
2025-11-14 16:26:41,997 - INFO - Processing document 4_2023-01-25
2025-11-14 16:26:42,064 - INFO - Finished converting document 4_2023-01-25 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2023-01-13' --> 'data\processed_data\DIS\4_2023-01-13.md'


2025-11-14 16:26:42,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:42,267 - INFO - Going to convert document batch...
2025-11-14 16:26:42,269 - INFO - Processing document 4_2023-02-22


Converted 'data\edgar_documents\DIS\4_2023-01-25' --> 'data\processed_data\DIS\4_2023-01-25.md'


2025-11-14 16:26:42,350 - INFO - Finished converting document 4_2023-02-22 in 0.20 sec.
2025-11-14 16:26:42,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:42,485 - INFO - Going to convert document batch...
2025-11-14 16:26:42,487 - INFO - Processing document 4_2023-03-09
2025-11-14 16:26:42,585 - INFO - Finished converting document 4_2023-03-09 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-02-22' --> 'data\processed_data\DIS\4_2023-02-22.md'


2025-11-14 16:26:42,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:42,713 - INFO - Going to convert document batch...
2025-11-14 16:26:42,714 - INFO - Processing document 4_2023-03-22
2025-11-14 16:26:42,801 - INFO - Finished converting document 4_2023-03-22 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-03-09' --> 'data\processed_data\DIS\4_2023-03-09.md'


2025-11-14 16:26:42,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:42,978 - INFO - Going to convert document batch...
2025-11-14 16:26:42,980 - INFO - Processing document 4_2023-04-04
2025-11-14 16:26:43,045 - INFO - Finished converting document 4_2023-04-04 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-03-22' --> 'data\processed_data\DIS\4_2023-03-22.md'


2025-11-14 16:26:43,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:43,223 - INFO - Going to convert document batch...
2025-11-14 16:26:43,225 - INFO - Processing document 4_2023-04-25
2025-11-14 16:26:43,306 - INFO - Finished converting document 4_2023-04-25 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-04-04' --> 'data\processed_data\DIS\4_2023-04-04.md'


2025-11-14 16:26:43,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:43,472 - INFO - Going to convert document batch...
2025-11-14 16:26:43,475 - INFO - Processing document 4_2023-06-16


Converted 'data\edgar_documents\DIS\4_2023-04-25' --> 'data\processed_data\DIS\4_2023-04-25.md'


2025-11-14 16:26:43,646 - INFO - Finished converting document 4_2023-06-16 in 0.23 sec.
2025-11-14 16:26:43,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:43,815 - INFO - Going to convert document batch...
2025-11-14 16:26:43,817 - INFO - Processing document 4_2023-06-23
2025-11-14 16:26:43,901 - INFO - Finished converting document 4_2023-06-23 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2023-06-16' --> 'data\processed_data\DIS\4_2023-06-16.md'


2025-11-14 16:26:44,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:44,058 - INFO - Going to convert document batch...
2025-11-14 16:26:44,060 - INFO - Processing document 4_2023-06-27
2025-11-14 16:26:44,129 - INFO - Finished converting document 4_2023-06-27 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-06-23' --> 'data\processed_data\DIS\4_2023-06-23.md'


2025-11-14 16:26:44,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:44,336 - INFO - Going to convert document batch...
2025-11-14 16:26:44,338 - INFO - Processing document 4_2023-06-28
2025-11-14 16:26:44,421 - INFO - Finished converting document 4_2023-06-28 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2023-06-27' --> 'data\processed_data\DIS\4_2023-06-27.md'


2025-11-14 16:26:44,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:44,589 - INFO - Going to convert document batch...
2025-11-14 16:26:44,591 - INFO - Processing document 4_2023-07-05
2025-11-14 16:26:44,662 - INFO - Finished converting document 4_2023-07-05 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-06-28' --> 'data\processed_data\DIS\4_2023-06-28.md'


2025-11-14 16:26:44,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:44,856 - INFO - Going to convert document batch...
2025-11-14 16:26:44,858 - INFO - Processing document 4_2023-07-19
2025-11-14 16:26:44,942 - INFO - Finished converting document 4_2023-07-19 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-07-05' --> 'data\processed_data\DIS\4_2023-07-05.md'


2025-11-14 16:26:45,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:45,129 - INFO - Going to convert document batch...
2025-11-14 16:26:45,132 - INFO - Processing document 4_2023-08-03


Converted 'data\edgar_documents\DIS\4_2023-07-19' --> 'data\processed_data\DIS\4_2023-07-19.md'


2025-11-14 16:26:45,278 - INFO - Finished converting document 4_2023-08-03 in 0.27 sec.
2025-11-14 16:26:45,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:45,495 - INFO - Going to convert document batch...
2025-11-14 16:26:45,497 - INFO - Processing document 4_2023-09-29
2025-11-14 16:26:45,579 - INFO - Finished converting document 4_2023-09-29 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-08-03' --> 'data\processed_data\DIS\4_2023-08-03.md'


2025-11-14 16:26:45,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:45,720 - INFO - Going to convert document batch...
2025-11-14 16:26:45,721 - INFO - Processing document 4_2023-10-03
2025-11-14 16:26:45,805 - INFO - Finished converting document 4_2023-10-03 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2023-09-29' --> 'data\processed_data\DIS\4_2023-09-29.md'


2025-11-14 16:26:45,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:45,934 - INFO - Going to convert document batch...
2025-11-14 16:26:45,936 - INFO - Processing document 4_2023-11-29
2025-11-14 16:26:46,010 - INFO - Finished converting document 4_2023-11-29 in 0.12 sec.


Converted 'data\edgar_documents\DIS\4_2023-10-03' --> 'data\processed_data\DIS\4_2023-10-03.md'


2025-11-14 16:26:46,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:46,193 - INFO - Going to convert document batch...
2025-11-14 16:26:46,195 - INFO - Processing document 4_2023-12-08
2025-11-14 16:26:46,278 - INFO - Finished converting document 4_2023-12-08 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-11-29' --> 'data\processed_data\DIS\4_2023-11-29.md'


2025-11-14 16:26:46,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:46,453 - INFO - Going to convert document batch...
2025-11-14 16:26:46,454 - INFO - Processing document 4_2023-12-15
2025-11-14 16:26:46,547 - INFO - Finished converting document 4_2023-12-15 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2023-12-08' --> 'data\processed_data\DIS\4_2023-12-08.md'


2025-11-14 16:26:46,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:46,742 - INFO - Going to convert document batch...
2025-11-14 16:26:46,745 - INFO - Processing document 4_2023-12-19


Converted 'data\edgar_documents\DIS\4_2023-12-15' --> 'data\processed_data\DIS\4_2023-12-15.md'


2025-11-14 16:26:46,914 - INFO - Finished converting document 4_2023-12-19 in 0.25 sec.
2025-11-14 16:26:47,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:47,102 - INFO - Going to convert document batch...
2025-11-14 16:26:47,104 - INFO - Processing document 4_2023-12-20
2025-11-14 16:26:47,212 - INFO - Finished converting document 4_2023-12-20 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2023-12-19' --> 'data\processed_data\DIS\4_2023-12-19.md'


2025-11-14 16:26:47,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\4_2023-12-20' --> 'data\processed_data\DIS\4_2023-12-20.md'


2025-11-14 16:26:48,338 - INFO - Going to convert document batch...
2025-11-14 16:26:48,340 - INFO - Processing document 4_2023-12-29
2025-11-14 16:26:48,451 - INFO - Finished converting document 4_2023-12-29 in 1.14 sec.
2025-11-14 16:26:48,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:48,661 - INFO - Going to convert document batch...
2025-11-14 16:26:48,662 - INFO - Processing document 4_2024-01-02
2025-11-14 16:26:48,750 - INFO - Finished converting document 4_2024-01-02 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2023-12-29' --> 'data\processed_data\DIS\4_2023-12-29.md'


2025-11-14 16:26:48,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:48,964 - INFO - Going to convert document batch...
2025-11-14 16:26:48,966 - INFO - Processing document 4_2024-01-12
2025-11-14 16:26:49,053 - INFO - Finished converting document 4_2024-01-12 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2024-01-02' --> 'data\processed_data\DIS\4_2024-01-02.md'


2025-11-14 16:26:49,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:49,237 - INFO - Going to convert document batch...
2025-11-14 16:26:49,239 - INFO - Processing document 4_2024-01-18
2025-11-14 16:26:49,337 - INFO - Finished converting document 4_2024-01-18 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2024-01-12' --> 'data\processed_data\DIS\4_2024-01-12.md'


2025-11-14 16:26:49,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:49,496 - INFO - Going to convert document batch...
2025-11-14 16:26:49,497 - INFO - Processing document 4_2024-02-20
2025-11-14 16:26:49,595 - INFO - Finished converting document 4_2024-02-20 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2024-01-18' --> 'data\processed_data\DIS\4_2024-01-18.md'


2025-11-14 16:26:49,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:49,741 - INFO - Going to convert document batch...
2025-11-14 16:26:49,743 - INFO - Processing document 4_2024-03-12
2025-11-14 16:26:49,818 - INFO - Finished converting document 4_2024-03-12 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2024-02-20' --> 'data\processed_data\DIS\4_2024-02-20.md'


2025-11-14 16:26:49,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:49,995 - INFO - Going to convert document batch...
2025-11-14 16:26:49,998 - INFO - Processing document 4_2024-04-02
2025-11-14 16:26:50,085 - INFO - Finished converting document 4_2024-04-02 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2024-03-12' --> 'data\processed_data\DIS\4_2024-03-12.md'


2025-11-14 16:26:50,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:50,234 - INFO - Going to convert document batch...
2025-11-14 16:26:50,236 - INFO - Processing document 4_2024-05-09
2025-11-14 16:26:50,302 - INFO - Finished converting document 4_2024-05-09 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2024-04-02' --> 'data\processed_data\DIS\4_2024-04-02.md'


2025-11-14 16:26:50,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:50,470 - INFO - Going to convert document batch...
2025-11-14 16:26:50,472 - INFO - Processing document 4_2024-06-18
2025-11-14 16:26:50,570 - INFO - Finished converting document 4_2024-06-18 in 0.20 sec.


Converted 'data\edgar_documents\DIS\4_2024-05-09' --> 'data\processed_data\DIS\4_2024-05-09.md'


2025-11-14 16:26:50,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:50,709 - INFO - Going to convert document batch...
2025-11-14 16:26:50,713 - INFO - Processing document 4_2024-06-25
2025-11-14 16:26:50,802 - INFO - Finished converting document 4_2024-06-25 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2024-06-18' --> 'data\processed_data\DIS\4_2024-06-18.md'


2025-11-14 16:26:50,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:50,981 - INFO - Going to convert document batch...
2025-11-14 16:26:50,984 - INFO - Processing document 4_2024-06-28
2025-11-14 16:26:51,062 - INFO - Finished converting document 4_2024-06-28 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2024-06-25' --> 'data\processed_data\DIS\4_2024-06-25.md'


2025-11-14 16:26:51,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:51,200 - INFO - Going to convert document batch...
2025-11-14 16:26:51,202 - INFO - Processing document 4_2024-07-02
2025-11-14 16:26:51,265 - INFO - Finished converting document 4_2024-07-02 in 0.11 sec.


Converted 'data\edgar_documents\DIS\4_2024-06-28' --> 'data\processed_data\DIS\4_2024-06-28.md'
Converted 'data\edgar_documents\DIS\4_2024-07-02' --> 'data\processed_data\DIS\4_2024-07-02.md'


2025-11-14 16:26:51,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:51,419 - INFO - Going to convert document batch...
2025-11-14 16:26:51,421 - INFO - Processing document 4_2024-07-18
2025-11-14 16:26:51,495 - INFO - Finished converting document 4_2024-07-18 in 0.17 sec.
2025-11-14 16:26:51,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:51,606 - INFO - Going to convert document batch...
2025-11-14 16:26:51,608 - INFO - Processing document 4_2024-08-09
2025-11-14 16:26:51,673 - INFO - Finished converting document 4_2024-08-09 in 0.11 sec.
2025-11-14 16:26:51,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\4_2024-07-18' --> 'data\processed_data\DIS\4_2024-07-18.md'
Converted 'data\edgar_documents\DIS\4_2024-08-09' --> 'data\processed_data\DIS\4_2024-08-09.md'


2025-11-14 16:26:51,784 - INFO - Going to convert document batch...
2025-11-14 16:26:51,785 - INFO - Processing document 4_2024-09-25
2025-11-14 16:26:51,847 - INFO - Finished converting document 4_2024-09-25 in 0.11 sec.
2025-11-14 16:26:51,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:52,003 - INFO - Going to convert document batch...
2025-11-14 16:26:52,005 - INFO - Processing document 4_2024-09-30
2025-11-14 16:26:52,096 - INFO - Finished converting document 4_2024-09-30 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2024-09-25' --> 'data\processed_data\DIS\4_2024-09-25.md'


2025-11-14 16:26:52,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:52,236 - INFO - Going to convert document batch...
2025-11-14 16:26:52,238 - INFO - Processing document 4_2024-10-02
2025-11-14 16:26:52,293 - INFO - Finished converting document 4_2024-10-02 in 0.12 sec.


Converted 'data\edgar_documents\DIS\4_2024-09-30' --> 'data\processed_data\DIS\4_2024-09-30.md'


2025-11-14 16:26:52,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:52,465 - INFO - Going to convert document batch...
2025-11-14 16:26:52,468 - INFO - Processing document 4_2024-11-01
2025-11-14 16:26:52,554 - INFO - Finished converting document 4_2024-11-01 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2024-10-02' --> 'data\processed_data\DIS\4_2024-10-02.md'


2025-11-14 16:26:52,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:52,836 - INFO - Going to convert document batch...
2025-11-14 16:26:52,837 - INFO - Processing document 4_2024-11-12


Converted 'data\edgar_documents\DIS\4_2024-11-01' --> 'data\processed_data\DIS\4_2024-11-01.md'


2025-11-14 16:26:52,914 - INFO - Finished converting document 4_2024-11-12 in 0.23 sec.
2025-11-14 16:26:53,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:53,058 - INFO - Going to convert document batch...
2025-11-14 16:26:53,060 - INFO - Processing document 4_2024-11-21
2025-11-14 16:26:53,158 - INFO - Finished converting document 4_2024-11-21 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2024-11-12' --> 'data\processed_data\DIS\4_2024-11-12.md'


2025-11-14 16:26:53,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:53,273 - INFO - Going to convert document batch...
2025-11-14 16:26:53,275 - INFO - Processing document 4_2024-11-22
2025-11-14 16:26:53,368 - INFO - Finished converting document 4_2024-11-22 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2024-11-21' --> 'data\processed_data\DIS\4_2024-11-21.md'


2025-11-14 16:26:53,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:53,496 - INFO - Going to convert document batch...
2025-11-14 16:26:53,498 - INFO - Processing document 4_2024-12-03
2025-11-14 16:26:53,572 - INFO - Finished converting document 4_2024-12-03 in 0.11 sec.


Converted 'data\edgar_documents\DIS\4_2024-11-22' --> 'data\processed_data\DIS\4_2024-11-22.md'
Converted 'data\edgar_documents\DIS\4_2024-12-03' --> 'data\processed_data\DIS\4_2024-12-03.md'


2025-11-14 16:26:53,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:53,721 - INFO - Going to convert document batch...
2025-11-14 16:26:53,724 - INFO - Processing document 4_2024-12-12
2025-11-14 16:26:53,817 - INFO - Finished converting document 4_2024-12-12 in 0.17 sec.
2025-11-14 16:26:53,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:53,971 - INFO - Going to convert document batch...
2025-11-14 16:26:53,973 - INFO - Processing document 4_2024-12-17


Converted 'data\edgar_documents\DIS\4_2024-12-12' --> 'data\processed_data\DIS\4_2024-12-12.md'


2025-11-14 16:26:54,113 - INFO - Finished converting document 4_2024-12-17 in 0.20 sec.
2025-11-14 16:26:54,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:54,273 - INFO - Going to convert document batch...
2025-11-14 16:26:54,275 - INFO - Processing document 4_2024-12-18
2025-11-14 16:26:54,356 - INFO - Finished converting document 4_2024-12-18 in 0.12 sec.


Converted 'data\edgar_documents\DIS\4_2024-12-17' --> 'data\processed_data\DIS\4_2024-12-17.md'


2025-11-14 16:26:54,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:54,535 - INFO - Going to convert document batch...
2025-11-14 16:26:54,537 - INFO - Processing document 4_2024-12-20


Converted 'data\edgar_documents\DIS\4_2024-12-18' --> 'data\processed_data\DIS\4_2024-12-18.md'


2025-11-14 16:26:54,652 - INFO - Finished converting document 4_2024-12-20 in 0.22 sec.
2025-11-14 16:26:54,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:54,803 - INFO - Going to convert document batch...
2025-11-14 16:26:54,805 - INFO - Processing document 4_2024-12-30
2025-11-14 16:26:54,882 - INFO - Finished converting document 4_2024-12-30 in 0.12 sec.


Converted 'data\edgar_documents\DIS\4_2024-12-20' --> 'data\processed_data\DIS\4_2024-12-20.md'
Converted 'data\edgar_documents\DIS\4_2024-12-30' --> 'data\processed_data\DIS\4_2024-12-30.md'


2025-11-14 16:26:55,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:55,062 - INFO - Going to convert document batch...
2025-11-14 16:26:55,065 - INFO - Processing document 4_2025-01-02
2025-11-14 16:26:55,142 - INFO - Finished converting document 4_2025-01-02 in 0.19 sec.
2025-11-14 16:26:55,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:55,252 - INFO - Going to convert document batch...
2025-11-14 16:26:55,254 - INFO - Processing document 4_2025-01-17
2025-11-14 16:26:55,316 - INFO - Finished converting document 4_2025-01-17 in 0.11 sec.


Converted 'data\edgar_documents\DIS\4_2025-01-02' --> 'data\processed_data\DIS\4_2025-01-02.md'
Converted 'data\edgar_documents\DIS\4_2025-01-17' --> 'data\processed_data\DIS\4_2025-01-17.md'


2025-11-14 16:26:55,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:55,457 - INFO - Going to convert document batch...
2025-11-14 16:26:55,459 - INFO - Processing document 4_2025-01-21
2025-11-14 16:26:55,555 - INFO - Finished converting document 4_2025-01-21 in 0.17 sec.
2025-11-14 16:26:55,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:55,738 - INFO - Going to convert document batch...
2025-11-14 16:26:55,739 - INFO - Processing document 4_2025-01-22
2025-11-14 16:26:55,797 - INFO - Finished converting document 4_2025-01-22 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2025-01-21' --> 'data\processed_data\DIS\4_2025-01-21.md'


2025-11-14 16:26:55,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:55,886 - INFO - Going to convert document batch...
2025-11-14 16:26:55,887 - INFO - Processing document 4_2025-04-02
2025-11-14 16:26:55,933 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.


Converted 'data\edgar_documents\DIS\4_2025-01-22' --> 'data\processed_data\DIS\4_2025-01-22.md'
Converted 'data\edgar_documents\DIS\4_2025-04-02' --> 'data\processed_data\DIS\4_2025-04-02.md'


2025-11-14 16:26:56,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:56,103 - INFO - Going to convert document batch...
2025-11-14 16:26:56,105 - INFO - Processing document 4_2025-05-13
2025-11-14 16:26:56,189 - INFO - Finished converting document 4_2025-05-13 in 0.14 sec.
2025-11-14 16:26:56,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:56,374 - INFO - Going to convert document batch...
2025-11-14 16:26:56,375 - INFO - Processing document 4_2025-06-17
2025-11-14 16:26:56,470 - INFO - Finished converting document 4_2025-06-17 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2025-05-13' --> 'data\processed_data\DIS\4_2025-05-13.md'


2025-11-14 16:26:56,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:56,593 - INFO - Going to convert document batch...
2025-11-14 16:26:56,594 - INFO - Processing document 4_2025-06-24
2025-11-14 16:26:56,684 - INFO - Finished converting document 4_2025-06-24 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2025-06-17' --> 'data\processed_data\DIS\4_2025-06-17.md'


2025-11-14 16:26:56,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:56,932 - INFO - Going to convert document batch...
2025-11-14 16:26:56,935 - INFO - Processing document 4_2025-06-30


Converted 'data\edgar_documents\DIS\4_2025-06-24' --> 'data\processed_data\DIS\4_2025-06-24.md'


2025-11-14 16:26:57,022 - INFO - Finished converting document 4_2025-06-30 in 0.25 sec.
2025-11-14 16:26:57,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:57,173 - INFO - Going to convert document batch...
2025-11-14 16:26:57,175 - INFO - Processing document 4_2025-07-02
2025-11-14 16:26:57,252 - INFO - Finished converting document 4_2025-07-02 in 0.12 sec.


Converted 'data\edgar_documents\DIS\4_2025-06-30' --> 'data\processed_data\DIS\4_2025-06-30.md'


2025-11-14 16:26:57,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:57,400 - INFO - Going to convert document batch...
2025-11-14 16:26:57,402 - INFO - Processing document 4_2025-07-16
2025-11-14 16:26:57,507 - INFO - Finished converting document 4_2025-07-16 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2025-07-02' --> 'data\processed_data\DIS\4_2025-07-02.md'


2025-11-14 16:26:57,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:57,644 - INFO - Going to convert document batch...
2025-11-14 16:26:57,645 - INFO - Processing document 4_2025-07-18
2025-11-14 16:26:57,746 - INFO - Finished converting document 4_2025-07-18 in 0.16 sec.


Converted 'data\edgar_documents\DIS\4_2025-07-16' --> 'data\processed_data\DIS\4_2025-07-16.md'


2025-11-14 16:26:57,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:57,893 - INFO - Going to convert document batch...
2025-11-14 16:26:57,895 - INFO - Processing document 4_2025-08-25
2025-11-14 16:26:57,978 - INFO - Finished converting document 4_2025-08-25 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2025-07-18' --> 'data\processed_data\DIS\4_2025-07-18.md'


2025-11-14 16:26:58,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:58,111 - INFO - Going to convert document batch...
2025-11-14 16:26:58,113 - INFO - Processing document 4_2025-09-23
2025-11-14 16:26:58,210 - INFO - Finished converting document 4_2025-09-23 in 0.14 sec.


Converted 'data\edgar_documents\DIS\4_2025-08-25' --> 'data\processed_data\DIS\4_2025-08-25.md'


2025-11-14 16:26:58,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:58,387 - INFO - Going to convert document batch...
2025-11-14 16:26:58,389 - INFO - Processing document 4_2025-09-24
2025-11-14 16:26:58,497 - INFO - Finished converting document 4_2025-09-24 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2025-09-23' --> 'data\processed_data\DIS\4_2025-09-23.md'


2025-11-14 16:26:58,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:58,643 - INFO - Going to convert document batch...
2025-11-14 16:26:58,646 - INFO - Processing document 4_2025-09-30
2025-11-14 16:26:58,763 - INFO - Finished converting document 4_2025-09-30 in 0.19 sec.


Converted 'data\edgar_documents\DIS\4_2025-09-24' --> 'data\processed_data\DIS\4_2025-09-24.md'


2025-11-14 16:26:58,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:58,956 - INFO - Going to convert document batch...
2025-11-14 16:26:58,959 - INFO - Processing document 4_2025-10-02
2025-11-14 16:26:59,030 - INFO - Finished converting document 4_2025-10-02 in 0.17 sec.


Converted 'data\edgar_documents\DIS\4_2025-09-30' --> 'data\processed_data\DIS\4_2025-09-30.md'


2025-11-14 16:26:59,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:59,220 - INFO - Going to convert document batch...
2025-11-14 16:26:59,222 - INFO - Processing document 8-K_2023-02-08


Converted 'data\edgar_documents\DIS\4_2025-10-02' --> 'data\processed_data\DIS\4_2025-10-02.md'


2025-11-14 16:26:59,318 - INFO - Finished converting document 8-K_2023-02-08 in 0.20 sec.
2025-11-14 16:26:59,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:59,448 - INFO - Going to convert document batch...
2025-11-14 16:26:59,450 - INFO - Processing document 8-K_2023-03-07
2025-11-14 16:26:59,525 - INFO - Finished converting document 8-K_2023-03-07 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-02-08' --> 'data\processed_data\DIS\8-K_2023-02-08.md'


2025-11-14 16:26:59,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:26:59,619 - INFO - Going to convert document batch...
2025-11-14 16:26:59,622 - INFO - Processing document 8-K_2023-03-13
2025-11-14 16:26:59,682 - INFO - Finished converting document 8-K_2023-03-13 in 0.12 sec.
2025-11-14 16:26:59,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\8-K_2023-03-07' --> 'data\processed_data\DIS\8-K_2023-03-07.md'
Converted 'data\edgar_documents\DIS\8-K_2023-03-13' --> 'data\processed_data\DIS\8-K_2023-03-13.md'


2025-11-14 16:26:59,865 - INFO - Going to convert document batch...
2025-11-14 16:26:59,867 - INFO - Processing document 8-K_2023-04-04
2025-11-14 16:27:00,076 - INFO - Finished converting document 8-K_2023-04-04 in 0.36 sec.
2025-11-14 16:27:00,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:00,232 - INFO - Going to convert document batch...
2025-11-14 16:27:00,233 - INFO - Processing document 8-K_2023-04-20
2025-11-14 16:27:00,311 - INFO - Finished converting document 8-K_2023-04-20 in 0.14 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-04-04' --> 'data\processed_data\DIS\8-K_2023-04-04.md'
Converted 'data\edgar_documents\DIS\8-K_2023-04-20' --> 'data\processed_data\DIS\8-K_2023-04-20.md'


2025-11-14 16:27:00,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:00,450 - INFO - Going to convert document batch...
2025-11-14 16:27:00,451 - INFO - Processing document 8-K_2023-05-10
2025-11-14 16:27:00,948 - INFO - Finished converting document 8-K_2023-05-10 in 0.61 sec.
2025-11-14 16:27:01,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:01,084 - INFO - Going to convert document batch...
2025-11-14 16:27:01,085 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:27:01,149 - INFO - Finished converting document 8-K_2023-06-02 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-05-10' --> 'data\processed_data\DIS\8-K_2023-05-10.md'


2025-11-14 16:27:01,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:01,278 - INFO - Going to convert document batch...
2025-11-14 16:27:01,280 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:27:01,339 - INFO - Finished converting document 8-K_2023-06-12 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-06-02' --> 'data\processed_data\DIS\8-K_2023-06-02.md'
Converted 'data\edgar_documents\DIS\8-K_2023-06-12' --> 'data\processed_data\DIS\8-K_2023-06-12.md'


2025-11-14 16:27:01,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:01,473 - INFO - Going to convert document batch...
2025-11-14 16:27:01,476 - INFO - Processing document 8-K_2023-06-15
2025-11-14 16:27:01,554 - INFO - Finished converting document 8-K_2023-06-15 in 0.17 sec.
2025-11-14 16:27:01,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:01,692 - INFO - Going to convert document batch...
2025-11-14 16:27:01,694 - INFO - Processing document 8-K_2023-07-12
2025-11-14 16:27:01,766 - INFO - Finished converting document 8-K_2023-07-12 in 0.17 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-06-15' --> 'data\processed_data\DIS\8-K_2023-06-15.md'


2025-11-14 16:27:01,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:01,923 - INFO - Going to convert document batch...
2025-11-14 16:27:01,924 - INFO - Processing document 8-K_2023-08-09


Converted 'data\edgar_documents\DIS\8-K_2023-07-12' --> 'data\processed_data\DIS\8-K_2023-07-12.md'


2025-11-14 16:27:02,015 - INFO - Finished converting document 8-K_2023-08-09 in 0.22 sec.
2025-11-14 16:27:02,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:02,134 - INFO - Going to convert document batch...
2025-11-14 16:27:02,138 - INFO - Processing document 8-K_2023-09-08
2025-11-14 16:27:02,228 - INFO - Finished converting document 8-K_2023-09-08 in 0.14 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-08-09' --> 'data\processed_data\DIS\8-K_2023-08-09.md'
Converted 'data\edgar_documents\DIS\8-K_2023-09-08' --> 'data\processed_data\DIS\8-K_2023-09-08.md'


2025-11-14 16:27:02,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:02,382 - INFO - Going to convert document batch...
2025-11-14 16:27:02,384 - INFO - Processing document 8-K_2023-09-19
2025-11-14 16:27:02,483 - INFO - Finished converting document 8-K_2023-09-19 in 0.22 sec.
2025-11-14 16:27:02,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:02,622 - INFO - Going to convert document batch...
2025-11-14 16:27:02,623 - INFO - Processing document 8-K_2023-10-18
2025-11-14 16:27:02,698 - INFO - Finished converting document 8-K_2023-10-18 in 0.17 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-09-19' --> 'data\processed_data\DIS\8-K_2023-09-19.md'


2025-11-14 16:27:02,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:02,862 - INFO - Going to convert document batch...
2025-11-14 16:27:02,864 - INFO - Processing document 8-K_2023-11-01


Converted 'data\edgar_documents\DIS\8-K_2023-10-18' --> 'data\processed_data\DIS\8-K_2023-10-18.md'


2025-11-14 16:27:02,949 - INFO - Finished converting document 8-K_2023-11-01 in 0.22 sec.
2025-11-14 16:27:03,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:03,097 - INFO - Going to convert document batch...
2025-11-14 16:27:03,098 - INFO - Processing document 8-K_2023-11-06
2025-11-14 16:27:03,173 - INFO - Finished converting document 8-K_2023-11-06 in 0.17 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-11-01' --> 'data\processed_data\DIS\8-K_2023-11-01.md'


2025-11-14 16:27:03,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:03,330 - INFO - Going to convert document batch...
2025-11-14 16:27:03,332 - INFO - Processing document 8-K_2023-11-08


Converted 'data\edgar_documents\DIS\8-K_2023-11-06' --> 'data\processed_data\DIS\8-K_2023-11-06.md'


2025-11-14 16:27:03,411 - INFO - Finished converting document 8-K_2023-11-08 in 0.19 sec.
2025-11-14 16:27:03,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:03,498 - INFO - Going to convert document batch...
2025-11-14 16:27:03,499 - INFO - Processing document 8-K_2023-11-29
2025-11-14 16:27:03,568 - INFO - Finished converting document 8-K_2023-11-29 in 0.11 sec.
2025-11-14 16:27:03,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\8-K_2023-11-08' --> 'data\processed_data\DIS\8-K_2023-11-08.md'
Converted 'data\edgar_documents\DIS\8-K_2023-11-29' --> 'data\processed_data\DIS\8-K_2023-11-29.md'


2025-11-14 16:27:03,693 - INFO - Going to convert document batch...
2025-11-14 16:27:03,694 - INFO - Processing document 8-K_2023-11-30
2025-11-14 16:27:03,766 - INFO - Finished converting document 8-K_2023-11-30 in 0.16 sec.
2025-11-14 16:27:03,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:03,885 - INFO - Going to convert document batch...
2025-11-14 16:27:03,886 - INFO - Processing document 8-K_2023-12-22
2025-11-14 16:27:03,951 - INFO - Finished converting document 8-K_2023-12-22 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-11-30' --> 'data\processed_data\DIS\8-K_2023-11-30.md'


2025-11-14 16:27:04,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:04,078 - INFO - Going to convert document batch...
2025-11-14 16:27:04,078 - INFO - Processing document 8-K_2024-02-07
2025-11-14 16:27:04,139 - INFO - Finished converting document 8-K_2024-02-07 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2023-12-22' --> 'data\processed_data\DIS\8-K_2023-12-22.md'


2025-11-14 16:27:04,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:04,234 - INFO - Going to convert document batch...
2025-11-14 16:27:04,235 - INFO - Processing document 8-K_2024-02-28
2025-11-14 16:27:04,295 - INFO - Finished converting document 8-K_2024-02-28 in 0.12 sec.


Converted 'data\edgar_documents\DIS\8-K_2024-02-07' --> 'data\processed_data\DIS\8-K_2024-02-07.md'
Converted 'data\edgar_documents\DIS\8-K_2024-02-28' --> 'data\processed_data\DIS\8-K_2024-02-28.md'


2025-11-14 16:27:04,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:04,458 - INFO - Going to convert document batch...
2025-11-14 16:27:04,460 - INFO - Processing document 8-K_2024-03-04
2025-11-14 16:27:04,517 - INFO - Finished converting document 8-K_2024-03-04 in 0.17 sec.
2025-11-14 16:27:04,574 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:27:04,576 - ERROR - Input document 8-K_2024-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\DIS\8-K_2024-03-04' --> 'data\processed_data\DIS\8-K_2024-03-04.md'
Error processing data\edgar_documents\DIS\8-K_2024-04-03: File format not allowed: data\edgar_documents\DIS\8-K_2024-04-03
Error processing data\edgar_documents\DIS\8-K_2024-04-09: File format not allowed: data\edgar_documents\DIS\8-K_2024-04-09
Error processing data\edgar_documents\DIS\8-K_2024-04-17: File format not allowed: data\edgar_documents\DIS\8-K_2024-04-17


2025-11-14 16:27:04,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:04,838 - INFO - Going to convert document batch...
2025-11-14 16:27:04,840 - INFO - Processing document 8-K_2024-07-19
2025-11-14 16:27:04,950 - INFO - Finished converting document 8-K_2024-07-19 in 0.17 sec.


Converted 'data\edgar_documents\DIS\8-K_2024-05-07' --> 'data\processed_data\DIS\8-K_2024-05-07.md'


2025-11-14 16:27:05,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:05,044 - INFO - Going to convert document batch...
2025-11-14 16:27:05,045 - INFO - Processing document 8-K_2024-08-07
2025-11-14 16:27:05,118 - INFO - Finished converting document 8-K_2024-08-07 in 0.12 sec.
2025-11-14 16:27:05,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\8-K_2024-07-19' --> 'data\processed_data\DIS\8-K_2024-07-19.md'
Converted 'data\edgar_documents\DIS\8-K_2024-08-07' --> 'data\processed_data\DIS\8-K_2024-08-07.md'


2025-11-14 16:27:05,226 - INFO - Going to convert document batch...
2025-11-14 16:27:05,228 - INFO - Processing document 8-K_2024-10-21
2025-11-14 16:27:05,299 - INFO - Finished converting document 8-K_2024-10-21 in 0.14 sec.
2025-11-14 16:27:05,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:05,390 - INFO - Going to convert document batch...
2025-11-14 16:27:05,391 - INFO - Processing document 8-K_2024-11-14
2025-11-14 16:27:05,455 - INFO - Finished converting document 8-K_2024-11-14 in 0.11 sec.
2025-11-14 16:27:05,520 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:27:05,521 - ERROR - Input document 8-K_2025-01-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.C

Converted 'data\edgar_documents\DIS\8-K_2024-10-21' --> 'data\processed_data\DIS\8-K_2024-10-21.md'
Converted 'data\edgar_documents\DIS\8-K_2024-11-14' --> 'data\processed_data\DIS\8-K_2024-11-14.md'
Error processing data\edgar_documents\DIS\8-K_2025-01-06: File format not allowed: data\edgar_documents\DIS\8-K_2025-01-06


2025-11-14 16:27:05,578 - INFO - Going to convert document batch...
2025-11-14 16:27:05,580 - INFO - Processing document 8-K_2025-02-05
2025-11-14 16:27:05,678 - INFO - Finished converting document 8-K_2025-02-05 in 0.16 sec.
2025-11-14 16:27:05,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:05,782 - INFO - Going to convert document batch...
2025-11-14 16:27:05,784 - INFO - Processing document 8-K_2025-03-04
2025-11-14 16:27:05,851 - INFO - Finished converting document 8-K_2025-03-04 in 0.12 sec.


Converted 'data\edgar_documents\DIS\8-K_2025-02-05' --> 'data\processed_data\DIS\8-K_2025-02-05.md'
Converted 'data\edgar_documents\DIS\8-K_2025-03-04' --> 'data\processed_data\DIS\8-K_2025-03-04.md'


2025-11-14 16:27:05,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:06,031 - INFO - Going to convert document batch...
2025-11-14 16:27:06,033 - INFO - Processing document 8-K_2025-03-24
2025-11-14 16:27:06,233 - INFO - Finished converting document 8-K_2025-03-24 in 0.34 sec.
2025-11-14 16:27:06,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:06,417 - INFO - Going to convert document batch...
2025-11-14 16:27:06,418 - INFO - Processing document 8-K_2025-05-07
2025-11-14 16:27:06,480 - INFO - Finished converting document 8-K_2025-05-07 in 0.16 sec.


Converted 'data\edgar_documents\DIS\8-K_2025-03-24' --> 'data\processed_data\DIS\8-K_2025-03-24.md'


2025-11-14 16:27:06,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:06,592 - INFO - Going to convert document batch...
2025-11-14 16:27:06,593 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:27:06,659 - INFO - Finished converting document 8-K_2025-06-09 in 0.14 sec.


Converted 'data\edgar_documents\DIS\8-K_2025-05-07' --> 'data\processed_data\DIS\8-K_2025-05-07.md'


2025-11-14 16:27:06,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:06,779 - INFO - Going to convert document batch...
2025-11-14 16:27:06,781 - INFO - Processing document 8-K_2025-08-06
2025-11-14 16:27:06,853 - INFO - Finished converting document 8-K_2025-08-06 in 0.14 sec.


Converted 'data\edgar_documents\DIS\8-K_2025-06-09' --> 'data\processed_data\DIS\8-K_2025-06-09.md'


2025-11-14 16:27:06,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:06,955 - INFO - Going to convert document batch...
2025-11-14 16:27:06,957 - INFO - Processing document 8-K_2025-10-01
2025-11-14 16:27:07,033 - INFO - Finished converting document 8-K_2025-10-01 in 0.14 sec.
2025-11-14 16:27:07,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\8-K_2025-08-06' --> 'data\processed_data\DIS\8-K_2025-08-06.md'
Converted 'data\edgar_documents\DIS\8-K_2025-10-01' --> 'data\processed_data\DIS\8-K_2025-10-01.md'


2025-11-14 16:27:07,119 - INFO - Going to convert document batch...
2025-11-14 16:27:07,121 - INFO - Processing document 8-K_2025-10-16
2025-11-14 16:27:07,184 - INFO - Finished converting document 8-K_2025-10-16 in 0.12 sec.
2025-11-14 16:27:07,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:07,314 - INFO - Going to convert document batch...
2025-11-14 16:27:07,316 - INFO - Processing document 8-K_2025-11-07
2025-11-14 16:27:07,388 - INFO - Finished converting document 8-K_2025-11-07 in 0.17 sec.


Converted 'data\edgar_documents\DIS\8-K_2025-10-16' --> 'data\processed_data\DIS\8-K_2025-10-16.md'


2025-11-14 16:27:07,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DIS\8-K_2025-11-07' --> 'data\processed_data\DIS\8-K_2025-11-07.md'


2025-11-14 16:27:09,818 - INFO - Going to convert document batch...
2025-11-14 16:27:09,820 - INFO - Processing document DEF-14A_2025-01-23
2025-11-14 16:27:20,181 - INFO - Finished converting document DEF-14A_2025-01-23 in 12.75 sec.


Converted 'data\edgar_documents\DIS\DEF-14A_2025-01-23' --> 'data\processed_data\DIS\DEF-14A_2025-01-23.md'
Processed 116 new files. Errors: 5
Found 132 files to process in data\edgar_documents\DUK


2025-11-14 16:27:24,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:27:37,593 - INFO - Going to convert document batch...
2025-11-14 16:27:37,595 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:27:37,596 - INFO - Processing document 10-K_2023-02-27
2025-11-14 16:28:14,889 - INFO - Finished converting document 10-K_2023-02-27 in 51.06 sec.


Converted 'data\edgar_documents\DUK\10-K_2023-02-27' --> 'data\processed_data\DUK\10-K_2023-02-27.md'


2025-11-14 16:28:26,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:28:39,008 - INFO - Going to convert document batch...
2025-11-14 16:28:39,011 - INFO - Processing document 10-K_2024-02-23
2025-11-14 16:29:17,710 - INFO - Finished converting document 10-K_2024-02-23 in 51.16 sec.


Converted 'data\edgar_documents\DUK\10-K_2024-02-23' --> 'data\processed_data\DUK\10-K_2024-02-23.md'


2025-11-14 16:29:29,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:29:43,071 - INFO - Going to convert document batch...
2025-11-14 16:29:43,073 - INFO - Processing document 10-K_2025-02-27
2025-11-14 16:30:26,832 - INFO - Finished converting document 10-K_2025-02-27 in 58.02 sec.
2025-11-14 16:30:38,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-K_2025-02-27' --> 'data\processed_data\DUK\10-K_2025-02-27.md'


2025-11-14 16:30:44,479 - INFO - Going to convert document batch...
2025-11-14 16:30:44,480 - INFO - Processing document 10-Q_2023-05-09
2025-11-14 16:30:58,609 - INFO - Finished converting document 10-Q_2023-05-09 in 20.17 sec.


Converted 'data\edgar_documents\DUK\10-Q_2023-05-09' --> 'data\processed_data\DUK\10-Q_2023-05-09.md'


2025-11-14 16:31:03,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:31:12,249 - INFO - Going to convert document batch...
2025-11-14 16:31:12,252 - INFO - Processing document 10-Q_2023-08-08
2025-11-14 16:31:30,857 - INFO - Finished converting document 10-Q_2023-08-08 in 27.28 sec.
2025-11-14 16:31:38,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-Q_2023-08-08' --> 'data\processed_data\DUK\10-Q_2023-08-08.md'


2025-11-14 16:31:48,263 - INFO - Going to convert document batch...
2025-11-14 16:31:48,265 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:32:00,879 - INFO - Finished converting document 10-Q_2023-11-02 in 22.92 sec.
2025-11-14 16:32:07,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-Q_2023-11-02' --> 'data\processed_data\DUK\10-Q_2023-11-02.md'


2025-11-14 16:32:14,102 - INFO - Going to convert document batch...
2025-11-14 16:32:14,103 - INFO - Processing document 10-Q_2024-05-07
2025-11-14 16:32:24,252 - INFO - Finished converting document 10-Q_2024-05-07 in 16.89 sec.
2025-11-14 16:32:28,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-Q_2024-05-07' --> 'data\processed_data\DUK\10-Q_2024-05-07.md'


2025-11-14 16:32:36,885 - INFO - Going to convert document batch...
2025-11-14 16:32:36,886 - INFO - Processing document 10-Q_2024-08-06
2025-11-14 16:32:49,433 - INFO - Finished converting document 10-Q_2024-08-06 in 20.78 sec.
2025-11-14 16:32:54,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-Q_2024-08-06' --> 'data\processed_data\DUK\10-Q_2024-08-06.md'


2025-11-14 16:33:02,996 - INFO - Going to convert document batch...
2025-11-14 16:33:02,999 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 16:33:16,359 - INFO - Finished converting document 10-Q_2024-11-07 in 21.92 sec.
2025-11-14 16:33:21,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\10-Q_2024-11-07' --> 'data\processed_data\DUK\10-Q_2024-11-07.md'


2025-11-14 16:33:28,900 - INFO - Going to convert document batch...
2025-11-14 16:33:28,901 - INFO - Processing document 10-Q_2025-05-06
2025-11-14 16:33:39,144 - INFO - Finished converting document 10-Q_2025-05-06 in 17.75 sec.


Converted 'data\edgar_documents\DUK\10-Q_2025-05-06' --> 'data\processed_data\DUK\10-Q_2025-05-06.md'


2025-11-14 16:33:43,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:33:52,899 - INFO - Going to convert document batch...
2025-11-14 16:33:52,902 - INFO - Processing document 10-Q_2025-08-05
2025-11-14 16:34:08,807 - INFO - Finished converting document 10-Q_2025-08-05 in 25.20 sec.


Converted 'data\edgar_documents\DUK\10-Q_2025-08-05' --> 'data\processed_data\DUK\10-Q_2025-08-05.md'


2025-11-14 16:34:14,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:24,525 - INFO - Going to convert document batch...
2025-11-14 16:34:24,526 - INFO - Processing document 10-Q_2025-11-07
2025-11-14 16:34:40,337 - INFO - Finished converting document 10-Q_2025-11-07 in 25.62 sec.
2025-11-14 16:34:45,376 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:45,378 - ERROR - Input document 4_2023-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <

Converted 'data\edgar_documents\DUK\10-Q_2025-11-07' --> 'data\processed_data\DUK\10-Q_2025-11-07.md'
Error processing data\edgar_documents\DUK\4_2023-02-06: File format not allowed: data\edgar_documents\DUK\4_2023-02-06


2025-11-14 16:34:45,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:45,702 - INFO - Going to convert document batch...
2025-11-14 16:34:45,704 - INFO - Processing document 4_2023-02-15
2025-11-14 16:34:45,770 - INFO - Finished converting document 4_2023-02-15 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2023-02-08' --> 'data\processed_data\DUK\4_2023-02-08.md'


2025-11-14 16:34:45,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:45,873 - INFO - Going to convert document batch...
2025-11-14 16:34:45,875 - INFO - Processing document 4_2023-02-22
2025-11-14 16:34:45,945 - INFO - Finished converting document 4_2023-02-22 in 0.11 sec.


Converted 'data\edgar_documents\DUK\4_2023-02-15' --> 'data\processed_data\DUK\4_2023-02-15.md'


2025-11-14 16:34:46,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:46,149 - INFO - Going to convert document batch...
2025-11-14 16:34:46,151 - INFO - Processing document 4_2023-02-24
2025-11-14 16:34:46,223 - INFO - Finished converting document 4_2023-02-24 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2023-02-22' --> 'data\processed_data\DUK\4_2023-02-22.md'


2025-11-14 16:34:46,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:46,376 - INFO - Going to convert document batch...
2025-11-14 16:34:46,378 - INFO - Processing document 4_2023-02-27
2025-11-14 16:34:46,472 - INFO - Finished converting document 4_2023-02-27 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2023-02-24' --> 'data\processed_data\DUK\4_2023-02-24.md'


2025-11-14 16:34:46,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:46,633 - INFO - Going to convert document batch...
2025-11-14 16:34:46,634 - INFO - Processing document 4_2023-04-05
2025-11-14 16:34:46,726 - INFO - Finished converting document 4_2023-04-05 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2023-02-27' --> 'data\processed_data\DUK\4_2023-02-27.md'


2025-11-14 16:34:46,881 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:46,882 - ERROR - Input document 4_2023-04-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:46,886 - INFO - Going to convert document batch...
2025-11-14 16:34:46,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:46,934 - INFO - Going to convert document batch...
2025-11-14 16:34:46,936 - INFO - Processing document 4_2023-05-08


Converted 'data\edgar_documents\DUK\4_2023-04-05' --> 'data\processed_data\DUK\4_2023-04-05.md'
Error processing data\edgar_documents\DUK\4_2023-04-10: File format not allowed: data\edgar_documents\DUK\4_2023-04-10


2025-11-14 16:34:47,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:47,180 - INFO - Going to convert document batch...
2025-11-14 16:34:47,182 - INFO - Processing document 4_2023-05-09
2025-11-14 16:34:47,265 - INFO - Finished converting document 4_2023-05-09 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2023-05-08' --> 'data\processed_data\DUK\4_2023-05-08.md'


2025-11-14 16:34:47,415 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:47,417 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:47,419 - INFO - Going to convert document batch...
2025-11-14 16:34:47,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:47,470 - INFO - Going to convert document batch...
2025-11-14 16:34:47,471 - INFO - Processing document 4_2023-05-23


Converted 'data\edgar_documents\DUK\4_2023-05-09' --> 'data\processed_data\DUK\4_2023-05-09.md'
Error processing data\edgar_documents\DUK\4_2023-05-15: File format not allowed: data\edgar_documents\DUK\4_2023-05-15


2025-11-14 16:34:47,544 - INFO - Finished converting document 4_2023-05-23 in 0.12 sec.
2025-11-14 16:34:47,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:47,709 - INFO - Going to convert document batch...
2025-11-14 16:34:47,713 - INFO - Processing document 4_2023-07-05
2025-11-14 16:34:47,791 - INFO - Finished converting document 4_2023-07-05 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2023-05-23' --> 'data\processed_data\DUK\4_2023-05-23.md'


2025-11-14 16:34:47,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:47,954 - INFO - Going to convert document batch...
2025-11-14 16:34:47,956 - INFO - Processing document 4_2023-07-07
2025-11-14 16:34:48,018 - INFO - Finished converting document 4_2023-07-07 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2023-07-05' --> 'data\processed_data\DUK\4_2023-07-05.md'


2025-11-14 16:34:48,164 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:48,165 - ERROR - Input document 4_2023-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:48,167 - INFO - Going to convert document batch...
2025-11-14 16:34:48,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:48,210 - INFO - Going to convert document batch...
2025-11-14 16:34:48,212 - INFO - Processing document 4_2023-08-18
2025-11-14 16:34:48,282 - INFO - Fin

Converted 'data\edgar_documents\DUK\4_2023-07-07' --> 'data\processed_data\DUK\4_2023-07-07.md'
Error processing data\edgar_documents\DUK\4_2023-08-07: File format not allowed: data\edgar_documents\DUK\4_2023-08-07


2025-11-14 16:34:48,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:48,399 - INFO - Going to convert document batch...
2025-11-14 16:34:48,400 - INFO - Processing document 4_2023-08-21
2025-11-14 16:34:48,478 - INFO - Finished converting document 4_2023-08-21 in 0.11 sec.


Converted 'data\edgar_documents\DUK\4_2023-08-18' --> 'data\processed_data\DUK\4_2023-08-18.md'
Converted 'data\edgar_documents\DUK\4_2023-08-21' --> 'data\processed_data\DUK\4_2023-08-21.md'


2025-11-14 16:34:48,607 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:48,609 - ERROR - Input document 4_2023-09-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:48,613 - INFO - Going to convert document batch...
2025-11-14 16:34:48,642 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:48,643 - ERROR - Input document 4_2023-09-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\DUK\4_2023-09-05: File format not allowed: data\edgar_documents\DUK\4_2023-09-05
Error processing data\edgar_documents\DUK\4_2023-09-06: File format not allowed: data\edgar_documents\DUK\4_2023-09-06


2025-11-14 16:34:48,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:48,933 - INFO - Going to convert document batch...
2025-11-14 16:34:48,934 - INFO - Processing document 4_2023-11-22
2025-11-14 16:34:49,002 - INFO - Finished converting document 4_2023-11-22 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2023-10-04' --> 'data\processed_data\DUK\4_2023-10-04.md'


2025-11-14 16:34:49,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:49,155 - INFO - Going to convert document batch...
2025-11-14 16:34:49,157 - INFO - Processing document 4_2023-12-19


Converted 'data\edgar_documents\DUK\4_2023-11-22' --> 'data\processed_data\DUK\4_2023-11-22.md'


2025-11-14 16:34:49,314 - INFO - Finished converting document 4_2023-12-19 in 0.23 sec.
2025-11-14 16:34:49,464 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:49,468 - ERROR - Input document 4_2024-01-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:49,472 - INFO - Going to convert document batch...
2025-11-14 16:34:49,502 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:49,503 - ERROR - Input document 4_2024-01-03 with forma

Converted 'data\edgar_documents\DUK\4_2023-12-19' --> 'data\processed_data\DUK\4_2023-12-19.md'
Error processing data\edgar_documents\DUK\4_2024-01-02: File format not allowed: data\edgar_documents\DUK\4_2024-01-02
Error processing data\edgar_documents\DUK\4_2024-01-03: File format not allowed: data\edgar_documents\DUK\4_2024-01-03
Error processing data\edgar_documents\DUK\4_2024-01-09: File format not allowed: data\edgar_documents\DUK\4_2024-01-09
Error processing data\edgar_documents\DUK\4_2024-01-10: File format not allowed: data\edgar_documents\DUK\4_2024-01-10


2025-11-14 16:34:49,631 - INFO - Going to convert document batch...
2025-11-14 16:34:49,633 - INFO - Processing document 4_2024-02-07
2025-11-14 16:34:49,730 - INFO - Finished converting document 4_2024-02-07 in 0.16 sec.
2025-11-14 16:34:49,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:49,884 - INFO - Going to convert document batch...
2025-11-14 16:34:49,885 - INFO - Processing document 4_2024-02-13
2025-11-14 16:34:49,952 - INFO - Finished converting document 4_2024-02-13 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2024-02-07' --> 'data\processed_data\DUK\4_2024-02-07.md'


2025-11-14 16:34:50,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:50,107 - INFO - Going to convert document batch...
2025-11-14 16:34:50,108 - INFO - Processing document 4_2024-02-26
2025-11-14 16:34:50,211 - INFO - Finished converting document 4_2024-02-26 in 0.19 sec.


Converted 'data\edgar_documents\DUK\4_2024-02-13' --> 'data\processed_data\DUK\4_2024-02-13.md'


2025-11-14 16:34:50,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:50,382 - INFO - Going to convert document batch...
2025-11-14 16:34:50,384 - INFO - Processing document 4_2024-03-13
2025-11-14 16:34:50,456 - INFO - Finished converting document 4_2024-03-13 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-02-26' --> 'data\processed_data\DUK\4_2024-02-26.md'


2025-11-14 16:34:50,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:50,619 - INFO - Going to convert document batch...
2025-11-14 16:34:50,621 - INFO - Processing document 4_2024-04-02
2025-11-14 16:34:50,707 - INFO - Finished converting document 4_2024-04-02 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-03-13' --> 'data\processed_data\DUK\4_2024-03-13.md'


2025-11-14 16:34:50,851 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:50,853 - ERROR - Input document 4_2024-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:50,857 - INFO - Going to convert document batch...
2025-11-14 16:34:50,884 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:50,885 - ERROR - Input document 4_2024-04-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\DUK\4_2024-04-02' --> 'data\processed_data\DUK\4_2024-04-02.md'
Error processing data\edgar_documents\DUK\4_2024-04-09: File format not allowed: data\edgar_documents\DUK\4_2024-04-09
Error processing data\edgar_documents\DUK\4_2024-04-10: File format not allowed: data\edgar_documents\DUK\4_2024-04-10


2025-11-14 16:34:51,027 - INFO - Finished converting document 4_2024-05-07 in 0.14 sec.
2025-11-14 16:34:51,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:51,180 - INFO - Going to convert document batch...
2025-11-14 16:34:51,183 - INFO - Processing document 4_2024-05-13
2025-11-14 16:34:51,265 - INFO - Finished converting document 4_2024-05-13 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-07' --> 'data\processed_data\DUK\4_2024-05-07.md'


2025-11-14 16:34:51,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:51,445 - INFO - Going to convert document batch...
2025-11-14 16:34:51,447 - INFO - Processing document 4_2024-05-14
2025-11-14 16:34:51,539 - INFO - Finished converting document 4_2024-05-14 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-13' --> 'data\processed_data\DUK\4_2024-05-13.md'


2025-11-14 16:34:51,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:51,721 - INFO - Going to convert document batch...
2025-11-14 16:34:51,723 - INFO - Processing document 4_2024-05-15
2025-11-14 16:34:51,799 - INFO - Finished converting document 4_2024-05-15 in 0.12 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-14' --> 'data\processed_data\DUK\4_2024-05-14.md'


2025-11-14 16:34:51,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:51,943 - INFO - Going to convert document batch...
2025-11-14 16:34:51,946 - INFO - Processing document 4_2024-05-16
2025-11-14 16:34:52,047 - INFO - Finished converting document 4_2024-05-16 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-15' --> 'data\processed_data\DUK\4_2024-05-15.md'


2025-11-14 16:34:52,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:52,200 - INFO - Going to convert document batch...
2025-11-14 16:34:52,203 - INFO - Processing document 4_2024-05-21
2025-11-14 16:34:52,293 - INFO - Finished converting document 4_2024-05-21 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-16' --> 'data\processed_data\DUK\4_2024-05-16.md'


2025-11-14 16:34:52,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:52,446 - INFO - Going to convert document batch...
2025-11-14 16:34:52,447 - INFO - Processing document 4_2024-05-22
2025-11-14 16:34:52,547 - INFO - Finished converting document 4_2024-05-22 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-05-21' --> 'data\processed_data\DUK\4_2024-05-21.md'


2025-11-14 16:34:52,683 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:52,684 - ERROR - Input document 4_2024-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:52,689 - INFO - Going to convert document batch...
2025-11-14 16:34:52,723 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:52,724 - ERROR - Input document 4_2024-06-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\DUK\4_2024-05-22' --> 'data\processed_data\DUK\4_2024-05-22.md'
Error processing data\edgar_documents\DUK\4_2024-06-05: File format not allowed: data\edgar_documents\DUK\4_2024-06-05
Error processing data\edgar_documents\DUK\4_2024-06-06: File format not allowed: data\edgar_documents\DUK\4_2024-06-06


2025-11-14 16:34:52,927 - INFO - Finished converting document 4_2024-07-03 in 0.19 sec.
2025-11-14 16:34:53,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:53,171 - INFO - Going to convert document batch...
2025-11-14 16:34:53,175 - INFO - Processing document 4_2024-08-12


Converted 'data\edgar_documents\DUK\4_2024-07-03' --> 'data\processed_data\DUK\4_2024-07-03.md'


2025-11-14 16:34:53,260 - INFO - Finished converting document 4_2024-08-12 in 0.22 sec.
2025-11-14 16:34:53,518 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:53,520 - ERROR - Input document 4_2024-08-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:53,523 - INFO - Going to convert document batch...
2025-11-14 16:34:53,558 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:53,559 - ERROR - Input document 4_2024-08-20 with forma

Converted 'data\edgar_documents\DUK\4_2024-08-12' --> 'data\processed_data\DUK\4_2024-08-12.md'
Error processing data\edgar_documents\DUK\4_2024-08-19: File format not allowed: data\edgar_documents\DUK\4_2024-08-19
Error processing data\edgar_documents\DUK\4_2024-08-20: File format not allowed: data\edgar_documents\DUK\4_2024-08-20


2025-11-14 16:34:53,802 - INFO - Finished converting document 4_2024-08-26 in 0.23 sec.
2025-11-14 16:34:53,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:53,955 - INFO - Going to convert document batch...
2025-11-14 16:34:53,956 - INFO - Processing document 4_2024-10-04
2025-11-14 16:34:54,099 - INFO - Finished converting document 4_2024-10-04 in 0.20 sec.


Converted 'data\edgar_documents\DUK\4_2024-08-26' --> 'data\processed_data\DUK\4_2024-08-26.md'


2025-11-14 16:34:54,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:54,268 - INFO - Going to convert document batch...
2025-11-14 16:34:54,271 - INFO - Processing document 4_2024-11-18
2025-11-14 16:34:54,353 - INFO - Finished converting document 4_2024-11-18 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2024-10-04' --> 'data\processed_data\DUK\4_2024-10-04.md'


2025-11-14 16:34:54,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:54,476 - INFO - Going to convert document batch...
2025-11-14 16:34:54,478 - INFO - Processing document 4_2024-12-02
2025-11-14 16:34:54,549 - INFO - Finished converting document 4_2024-12-02 in 0.12 sec.


Converted 'data\edgar_documents\DUK\4_2024-11-18' --> 'data\processed_data\DUK\4_2024-11-18.md'


2025-11-14 16:34:54,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:54,694 - INFO - Going to convert document batch...
2025-11-14 16:34:54,696 - INFO - Processing document 4_2024-12-18
2025-11-14 16:34:54,779 - INFO - Finished converting document 4_2024-12-18 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2024-12-02' --> 'data\processed_data\DUK\4_2024-12-02.md'


2025-11-14 16:34:54,881 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:54,883 - ERROR - Input document 4_2024-12-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:54,886 - INFO - Going to convert document batch...
2025-11-14 16:34:54,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:54,961 - INFO - Going to convert document batch...
2025-11-14 16:34:54,963 - INFO - Processing document 4_2025-02-11


Converted 'data\edgar_documents\DUK\4_2024-12-18' --> 'data\processed_data\DUK\4_2024-12-18.md'
Error processing data\edgar_documents\DUK\4_2024-12-23: File format not allowed: data\edgar_documents\DUK\4_2024-12-23


2025-11-14 16:34:55,064 - INFO - Finished converting document 4_2025-02-11 in 0.17 sec.
2025-11-14 16:34:55,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:55,236 - INFO - Going to convert document batch...
2025-11-14 16:34:55,238 - INFO - Processing document 4_2025-02-20
2025-11-14 16:34:55,337 - INFO - Finished converting document 4_2025-02-20 in 0.19 sec.


Converted 'data\edgar_documents\DUK\4_2025-02-11' --> 'data\processed_data\DUK\4_2025-02-11.md'


2025-11-14 16:34:55,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:55,490 - INFO - Going to convert document batch...
2025-11-14 16:34:55,494 - INFO - Processing document 4_2025-02-25
2025-11-14 16:34:55,590 - INFO - Finished converting document 4_2025-02-25 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2025-02-20' --> 'data\processed_data\DUK\4_2025-02-20.md'


2025-11-14 16:34:55,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:55,725 - INFO - Going to convert document batch...
2025-11-14 16:34:55,727 - INFO - Processing document 4_2025-02-28
2025-11-14 16:34:55,818 - INFO - Finished converting document 4_2025-02-28 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2025-02-25' --> 'data\processed_data\DUK\4_2025-02-25.md'


2025-11-14 16:34:55,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:56,030 - INFO - Going to convert document batch...
2025-11-14 16:34:56,038 - INFO - Processing document 4_2025-03-03
2025-11-14 16:34:56,135 - INFO - Finished converting document 4_2025-03-03 in 0.22 sec.


Converted 'data\edgar_documents\DUK\4_2025-02-28' --> 'data\processed_data\DUK\4_2025-02-28.md'


2025-11-14 16:34:56,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:56,253 - INFO - Going to convert document batch...
2025-11-14 16:34:56,255 - INFO - Processing document 4_2025-04-03
2025-11-14 16:34:56,327 - INFO - Finished converting document 4_2025-04-03 in 0.11 sec.
2025-11-14 16:34:56,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DUK\4_2025-03-03' --> 'data\processed_data\DUK\4_2025-03-03.md'
Converted 'data\edgar_documents\DUK\4_2025-04-03' --> 'data\processed_data\DUK\4_2025-04-03.md'


2025-11-14 16:34:56,441 - INFO - Going to convert document batch...
2025-11-14 16:34:56,442 - INFO - Processing document 4_2025-04-04
2025-11-14 16:34:56,521 - INFO - Finished converting document 4_2025-04-04 in 0.12 sec.
2025-11-14 16:34:56,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:56,642 - INFO - Going to convert document batch...
2025-11-14 16:34:56,644 - INFO - Processing document 4_2025-05-02
2025-11-14 16:34:56,735 - INFO - Finished converting document 4_2025-05-02 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2025-04-04' --> 'data\processed_data\DUK\4_2025-04-04.md'


2025-11-14 16:34:56,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:56,870 - INFO - Going to convert document batch...
2025-11-14 16:34:56,873 - INFO - Processing document 4_2025-05-05
2025-11-14 16:34:56,961 - INFO - Finished converting document 4_2025-05-05 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2025-05-02' --> 'data\processed_data\DUK\4_2025-05-02.md'


2025-11-14 16:34:57,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:57,107 - INFO - Going to convert document batch...
2025-11-14 16:34:57,109 - INFO - Processing document 4_2025-07-07
2025-11-14 16:34:57,190 - INFO - Finished converting document 4_2025-07-07 in 0.16 sec.


Converted 'data\edgar_documents\DUK\4_2025-05-05' --> 'data\processed_data\DUK\4_2025-05-05.md'


2025-11-14 16:34:57,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:57,330 - INFO - Going to convert document batch...
2025-11-14 16:34:57,332 - INFO - Processing document 4_2025-08-08
2025-11-14 16:34:57,438 - INFO - Finished converting document 4_2025-08-08 in 0.17 sec.


Converted 'data\edgar_documents\DUK\4_2025-07-07' --> 'data\processed_data\DUK\4_2025-07-07.md'


2025-11-14 16:34:57,556 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:57,590 - INFO - Going to convert document batch...
2025-11-14 16:34:57,593 - INFO - Processing document 4_2025-08-12
2025-11-14 16:34:57,680 - INFO - Finished converting document 4_2025-08-12 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2025-08-08' --> 'data\processed_data\DUK\4_2025-08-08.md'


2025-11-14 16:34:57,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:57,956 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DUK\4_2025-08-12' --> 'data\processed_data\DUK\4_2025-08-12.md'


2025-11-14 16:34:57,958 - INFO - Processing document 4_2025-08-13
2025-11-14 16:34:58,053 - INFO - Finished converting document 4_2025-08-13 in 0.28 sec.
2025-11-14 16:34:58,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:58,200 - INFO - Going to convert document batch...
2025-11-14 16:34:58,202 - INFO - Processing document 4_2025-08-21
2025-11-14 16:34:58,301 - INFO - Finished converting document 4_2025-08-21 in 0.14 sec.


Converted 'data\edgar_documents\DUK\4_2025-08-13' --> 'data\processed_data\DUK\4_2025-08-13.md'


2025-11-14 16:34:58,452 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:58,455 - ERROR - Input document 4_2025-09-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:58,459 - INFO - Going to convert document batch...
2025-11-14 16:34:58,512 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:58,514 - ERROR - Input document 4_2025-09-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\DUK\4_2025-08-21' --> 'data\processed_data\DUK\4_2025-08-21.md'
Error processing data\edgar_documents\DUK\4_2025-09-08: File format not allowed: data\edgar_documents\DUK\4_2025-09-08
Error processing data\edgar_documents\DUK\4_2025-09-09: File format not allowed: data\edgar_documents\DUK\4_2025-09-09


2025-11-14 16:34:58,649 - INFO - Finished converting document 4_2025-09-16 in 0.12 sec.
2025-11-14 16:34:58,784 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:58,786 - ERROR - Input document 4_2025-09-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:58,790 - INFO - Going to convert document batch...
2025-11-14 16:34:58,809 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:58,811 - ERROR - Input document 4_2025-10-01 with forma

Converted 'data\edgar_documents\DUK\4_2025-09-16' --> 'data\processed_data\DUK\4_2025-09-16.md'
Error processing data\edgar_documents\DUK\4_2025-09-29: File format not allowed: data\edgar_documents\DUK\4_2025-09-29
Error processing data\edgar_documents\DUK\4_2025-10-01: File format not allowed: data\edgar_documents\DUK\4_2025-10-01


2025-11-14 16:34:59,134 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:34:59,135 - ERROR - Input document 4_2025-11-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:34:59,139 - INFO - Going to convert document batch...
2025-11-14 16:34:59,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:59,236 - INFO - Going to convert document batch...
2025-11-14 16:34:59,238 - INFO - Processing document 8-K_2023-01-03


Converted 'data\edgar_documents\DUK\4_2025-10-03' --> 'data\processed_data\DUK\4_2025-10-03.md'
Error processing data\edgar_documents\DUK\4_2025-11-10: File format not allowed: data\edgar_documents\DUK\4_2025-11-10


2025-11-14 16:34:59,408 - INFO - Finished converting document 8-K_2023-01-03 in 0.27 sec.
2025-11-14 16:34:59,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:59,680 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DUK\8-K_2023-01-03' --> 'data\processed_data\DUK\8-K_2023-01-03.md'


2025-11-14 16:34:59,682 - INFO - Processing document 8-K_2023-01-19
2025-11-14 16:34:59,796 - INFO - Finished converting document 8-K_2023-01-19 in 0.30 sec.
2025-11-14 16:34:59,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:34:59,953 - INFO - Going to convert document batch...
2025-11-14 16:34:59,955 - INFO - Processing document 8-K_2023-02-09
2025-11-14 16:35:00,026 - INFO - Finished converting document 8-K_2023-02-09 in 0.16 sec.


Converted 'data\edgar_documents\DUK\8-K_2023-01-19' --> 'data\processed_data\DUK\8-K_2023-01-19.md'
Converted 'data\edgar_documents\DUK\8-K_2023-02-09' --> 'data\processed_data\DUK\8-K_2023-02-09.md'


2025-11-14 16:35:00,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:00,224 - INFO - Going to convert document batch...
2025-11-14 16:35:00,226 - INFO - Processing document 8-K_2023-03-10
2025-11-14 16:35:00,285 - INFO - Finished converting document 8-K_2023-03-10 in 0.20 sec.
2025-11-14 16:35:00,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:00,531 - INFO - Going to convert document batch...
2025-11-14 16:35:00,532 - INFO - Processing document 8-K_2023-04-03


Converted 'data\edgar_documents\DUK\8-K_2023-03-10' --> 'data\processed_data\DUK\8-K_2023-03-10.md'


2025-11-14 16:35:00,743 - INFO - Finished converting document 8-K_2023-04-03 in 0.33 sec.
2025-11-14 16:35:00,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:00,926 - INFO - Going to convert document batch...
2025-11-14 16:35:00,929 - INFO - Processing document 8-K_2023-04-04
2025-11-14 16:35:01,002 - INFO - Finished converting document 8-K_2023-04-04 in 0.14 sec.


Converted 'data\edgar_documents\DUK\8-K_2023-04-03' --> 'data\processed_data\DUK\8-K_2023-04-03.md'
Converted 'data\edgar_documents\DUK\8-K_2023-04-04' --> 'data\processed_data\DUK\8-K_2023-04-04.md'


2025-11-14 16:35:01,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:01,186 - INFO - Going to convert document batch...
2025-11-14 16:35:01,189 - INFO - Processing document 8-K_2023-04-06
2025-11-14 16:35:01,292 - INFO - Finished converting document 8-K_2023-04-06 in 0.25 sec.
2025-11-14 16:35:01,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:01,500 - INFO - Going to convert document batch...
2025-11-14 16:35:01,502 - INFO - Processing document 8-K_2023-04-28


Converted 'data\edgar_documents\DUK\8-K_2023-04-06' --> 'data\processed_data\DUK\8-K_2023-04-06.md'


2025-11-14 16:35:01,595 - INFO - Finished converting document 8-K_2023-04-28 in 0.22 sec.
2025-11-14 16:35:01,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:01,841 - INFO - Going to convert document batch...
2025-11-14 16:35:01,843 - INFO - Processing document 8-K_2023-05-09


Converted 'data\edgar_documents\DUK\8-K_2023-04-28' --> 'data\processed_data\DUK\8-K_2023-04-28.md'


2025-11-14 16:35:02,177 - INFO - Finished converting document 8-K_2023-05-09 in 0.47 sec.
2025-11-14 16:35:02,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:02,499 - INFO - Going to convert document batch...
2025-11-14 16:35:02,502 - INFO - Processing document 8-K_2023-06-12


Converted 'data\edgar_documents\DUK\8-K_2023-05-09' --> 'data\processed_data\DUK\8-K_2023-05-09.md'


2025-11-14 16:35:02,699 - INFO - Finished converting document 8-K_2023-06-12 in 0.34 sec.
2025-11-14 16:35:02,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:02,940 - INFO - Going to convert document batch...
2025-11-14 16:35:02,942 - INFO - Processing document 8-K_2023-08-08


Converted 'data\edgar_documents\DUK\8-K_2023-06-12' --> 'data\processed_data\DUK\8-K_2023-06-12.md'


2025-11-14 16:35:03,028 - INFO - Finished converting document 8-K_2023-08-08 in 0.20 sec.
2025-11-14 16:35:03,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:03,188 - INFO - Going to convert document batch...
2025-11-14 16:35:03,190 - INFO - Processing document 8-K_2023-08-21


Converted 'data\edgar_documents\DUK\8-K_2023-08-08' --> 'data\processed_data\DUK\8-K_2023-08-08.md'


2025-11-14 16:35:03,287 - INFO - Finished converting document 8-K_2023-08-21 in 0.20 sec.
2025-11-14 16:35:03,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:03,437 - INFO - Going to convert document batch...
2025-11-14 16:35:03,439 - INFO - Processing document 8-K_2023-08-22


Converted 'data\edgar_documents\DUK\8-K_2023-08-21' --> 'data\processed_data\DUK\8-K_2023-08-21.md'


2025-11-14 16:35:03,573 - INFO - Finished converting document 8-K_2023-08-22 in 0.22 sec.
2025-11-14 16:35:03,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:03,782 - INFO - Going to convert document batch...
2025-11-14 16:35:03,785 - INFO - Processing document 8-K_2023-08-28


Converted 'data\edgar_documents\DUK\8-K_2023-08-22' --> 'data\processed_data\DUK\8-K_2023-08-22.md'


2025-11-14 16:35:03,883 - INFO - Finished converting document 8-K_2023-08-28 in 0.22 sec.
2025-11-14 16:35:04,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:04,079 - INFO - Going to convert document batch...
2025-11-14 16:35:04,081 - INFO - Processing document 8-K_2023-09-08


Converted 'data\edgar_documents\DUK\8-K_2023-08-28' --> 'data\processed_data\DUK\8-K_2023-08-28.md'


2025-11-14 16:35:04,213 - INFO - Finished converting document 8-K_2023-09-08 in 0.27 sec.
2025-11-14 16:35:04,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:04,410 - INFO - Going to convert document batch...
2025-11-14 16:35:04,412 - INFO - Processing document 8-K_2023-11-02
2025-11-14 16:35:04,490 - INFO - Finished converting document 8-K_2023-11-02 in 0.19 sec.


Converted 'data\edgar_documents\DUK\8-K_2023-09-08' --> 'data\processed_data\DUK\8-K_2023-09-08.md'


2025-11-14 16:35:04,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:04,653 - INFO - Going to convert document batch...
2025-11-14 16:35:04,656 - INFO - Processing document 8-K_2023-12-18


Converted 'data\edgar_documents\DUK\8-K_2023-11-02' --> 'data\processed_data\DUK\8-K_2023-11-02.md'


2025-11-14 16:35:04,780 - INFO - Finished converting document 8-K_2023-12-18 in 0.23 sec.
2025-11-14 16:35:04,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:04,983 - INFO - Going to convert document batch...
2025-11-14 16:35:04,986 - INFO - Processing document 8-K_2023-12-19
2025-11-14 16:35:05,070 - INFO - Finished converting document 8-K_2023-12-19 in 0.20 sec.


Converted 'data\edgar_documents\DUK\8-K_2023-12-18' --> 'data\processed_data\DUK\8-K_2023-12-18.md'


2025-11-14 16:35:05,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:05,258 - INFO - Going to convert document batch...
2025-11-14 16:35:05,259 - INFO - Processing document 8-K_2024-01-05


Converted 'data\edgar_documents\DUK\8-K_2023-12-19' --> 'data\processed_data\DUK\8-K_2023-12-19.md'


2025-11-14 16:35:05,369 - INFO - Finished converting document 8-K_2024-01-05 in 0.23 sec.
2025-11-14 16:35:05,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:05,560 - INFO - Going to convert document batch...
2025-11-14 16:35:05,562 - INFO - Processing document 8-K_2024-01-12


Converted 'data\edgar_documents\DUK\8-K_2024-01-05' --> 'data\processed_data\DUK\8-K_2024-01-05.md'


2025-11-14 16:35:05,655 - INFO - Finished converting document 8-K_2024-01-12 in 0.22 sec.
2025-11-14 16:35:05,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:05,840 - INFO - Going to convert document batch...
2025-11-14 16:35:05,843 - INFO - Processing document 8-K_2024-01-31


Converted 'data\edgar_documents\DUK\8-K_2024-01-12' --> 'data\processed_data\DUK\8-K_2024-01-12.md'


2025-11-14 16:35:05,975 - INFO - Finished converting document 8-K_2024-01-31 in 0.24 sec.
2025-11-14 16:35:06,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:06,186 - INFO - Going to convert document batch...
2025-11-14 16:35:06,190 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:35:06,280 - INFO - Finished converting document 8-K_2024-02-08 in 0.17 sec.


Converted 'data\edgar_documents\DUK\8-K_2024-01-31' --> 'data\processed_data\DUK\8-K_2024-01-31.md'


2025-11-14 16:35:06,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:06,425 - INFO - Going to convert document batch...
2025-11-14 16:35:06,428 - INFO - Processing document 8-K_2024-03-15
2025-11-14 16:35:06,536 - INFO - Finished converting document 8-K_2024-03-15 in 0.19 sec.


Converted 'data\edgar_documents\DUK\8-K_2024-02-08' --> 'data\processed_data\DUK\8-K_2024-02-08.md'


2025-11-14 16:35:06,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:06,719 - INFO - Going to convert document batch...
2025-11-14 16:35:06,722 - INFO - Processing document 8-K_2024-04-12


Converted 'data\edgar_documents\DUK\8-K_2024-03-15' --> 'data\processed_data\DUK\8-K_2024-03-15.md'


2025-11-14 16:35:06,854 - INFO - Finished converting document 8-K_2024-04-12 in 0.26 sec.
2025-11-14 16:35:06,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:07,044 - INFO - Going to convert document batch...
2025-11-14 16:35:07,047 - INFO - Processing document 8-K_2024-05-07
2025-11-14 16:35:07,135 - INFO - Finished converting document 8-K_2024-05-07 in 0.20 sec.


Converted 'data\edgar_documents\DUK\8-K_2024-04-12' --> 'data\processed_data\DUK\8-K_2024-04-12.md'


2025-11-14 16:35:07,264 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:35:07,266 - ERROR - Input document 8-K_2024-05-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:35:07,270 - INFO - Going to convert document batch...
2025-11-14 16:35:07,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:07,364 - INFO - Going to convert document batch...
2025-11-14 16:35:07,366 - INFO - Processing document 8-K_2024-06

Converted 'data\edgar_documents\DUK\8-K_2024-05-07' --> 'data\processed_data\DUK\8-K_2024-05-07.md'
Error processing data\edgar_documents\DUK\8-K_2024-05-13: File format not allowed: data\edgar_documents\DUK\8-K_2024-05-13


2025-11-14 16:35:07,507 - INFO - Finished converting document 8-K_2024-06-07 in 0.23 sec.
2025-11-14 16:35:07,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:07,714 - INFO - Going to convert document batch...
2025-11-14 16:35:07,717 - INFO - Processing document 8-K_2024-07-08


Converted 'data\edgar_documents\DUK\8-K_2024-06-07' --> 'data\processed_data\DUK\8-K_2024-06-07.md'


2025-11-14 16:35:07,882 - INFO - Finished converting document 8-K_2024-07-08 in 0.28 sec.
2025-11-14 16:35:08,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:08,108 - INFO - Going to convert document batch...
2025-11-14 16:35:08,110 - INFO - Processing document 8-K_2024-07-15


Converted 'data\edgar_documents\DUK\8-K_2024-07-08' --> 'data\processed_data\DUK\8-K_2024-07-08.md'


2025-11-14 16:35:08,217 - INFO - Finished converting document 8-K_2024-07-15 in 0.24 sec.
2025-11-14 16:35:08,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:08,415 - INFO - Going to convert document batch...
2025-11-14 16:35:08,418 - INFO - Processing document 8-K_2024-08-06
2025-11-14 16:35:08,484 - INFO - Finished converting document 8-K_2024-08-06 in 0.19 sec.


Converted 'data\edgar_documents\DUK\8-K_2024-07-15' --> 'data\processed_data\DUK\8-K_2024-07-15.md'


2025-11-14 16:35:08,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:08,648 - INFO - Going to convert document batch...
2025-11-14 16:35:08,651 - INFO - Processing document 8-K_2024-08-22


Converted 'data\edgar_documents\DUK\8-K_2024-08-06' --> 'data\processed_data\DUK\8-K_2024-08-06.md'


2025-11-14 16:35:08,811 - INFO - Finished converting document 8-K_2024-08-22 in 0.28 sec.
2025-11-14 16:35:08,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:08,961 - INFO - Going to convert document batch...
2025-11-14 16:35:08,963 - INFO - Processing document 8-K_2024-11-07
2025-11-14 16:35:09,028 - INFO - Finished converting document 8-K_2024-11-07 in 0.12 sec.


Converted 'data\edgar_documents\DUK\8-K_2024-08-22' --> 'data\processed_data\DUK\8-K_2024-08-22.md'
Converted 'data\edgar_documents\DUK\8-K_2024-11-07' --> 'data\processed_data\DUK\8-K_2024-11-07.md'


2025-11-14 16:35:09,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:09,156 - INFO - Going to convert document batch...
2025-11-14 16:35:09,158 - INFO - Processing document 8-K_2025-01-13
2025-11-14 16:35:09,271 - INFO - Finished converting document 8-K_2025-01-13 in 0.19 sec.
2025-11-14 16:35:09,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:09,463 - INFO - Going to convert document batch...
2025-11-14 16:35:09,465 - INFO - Processing document 8-K_2025-02-03
2025-11-14 16:35:09,543 - INFO - Finished converting document 8-K_2025-02-03 in 0.19 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-01-13' --> 'data\processed_data\DUK\8-K_2025-01-13.md'


2025-11-14 16:35:09,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:09,666 - INFO - Going to convert document batch...
2025-11-14 16:35:09,668 - INFO - Processing document 8-K_2025-02-13
2025-11-14 16:35:09,755 - INFO - Finished converting document 8-K_2025-02-13 in 0.16 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-02-03' --> 'data\processed_data\DUK\8-K_2025-02-03.md'


2025-11-14 16:35:09,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:09,958 - INFO - Going to convert document batch...
2025-11-14 16:35:09,962 - INFO - Processing document 8-K_2025-03-17


Converted 'data\edgar_documents\DUK\8-K_2025-02-13' --> 'data\processed_data\DUK\8-K_2025-02-13.md'


2025-11-14 16:35:10,297 - INFO - Finished converting document 8-K_2025-03-17 in 0.48 sec.
2025-11-14 16:35:10,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:10,588 - INFO - Going to convert document batch...
2025-11-14 16:35:10,591 - INFO - Processing document 8-K_2025-05-05


Converted 'data\edgar_documents\DUK\8-K_2025-03-17' --> 'data\processed_data\DUK\8-K_2025-03-17.md'


2025-11-14 16:35:10,830 - INFO - Finished converting document 8-K_2025-05-05 in 0.39 sec.
2025-11-14 16:35:11,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:11,065 - INFO - Going to convert document batch...
2025-11-14 16:35:11,067 - INFO - Processing document 8-K_2025-05-06
2025-11-14 16:35:11,129 - INFO - Finished converting document 8-K_2025-05-06 in 0.16 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-05-05' --> 'data\processed_data\DUK\8-K_2025-05-05.md'


2025-11-14 16:35:11,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:11,327 - INFO - Going to convert document batch...
2025-11-14 16:35:11,329 - INFO - Processing document 8-K_2025-07-29


Converted 'data\edgar_documents\DUK\8-K_2025-05-06' --> 'data\processed_data\DUK\8-K_2025-05-06.md'


2025-11-14 16:35:11,524 - INFO - Finished converting document 8-K_2025-07-29 in 0.34 sec.
2025-11-14 16:35:11,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:11,737 - INFO - Going to convert document batch...
2025-11-14 16:35:11,739 - INFO - Processing document 8-K_2025-08-05
2025-11-14 16:35:11,809 - INFO - Finished converting document 8-K_2025-08-05 in 0.16 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-07-29' --> 'data\processed_data\DUK\8-K_2025-07-29.md'


2025-11-14 16:35:11,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:11,990 - INFO - Going to convert document batch...
2025-11-14 16:35:11,991 - INFO - Processing document 8-K_2025-09-11


Converted 'data\edgar_documents\DUK\8-K_2025-08-05' --> 'data\processed_data\DUK\8-K_2025-08-05.md'


2025-11-14 16:35:12,125 - INFO - Finished converting document 8-K_2025-09-11 in 0.25 sec.
2025-11-14 16:35:12,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:12,305 - INFO - Going to convert document batch...
2025-11-14 16:35:12,307 - INFO - Processing document 8-K_2025-09-12
2025-11-14 16:35:12,390 - INFO - Finished converting document 8-K_2025-09-12 in 0.19 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-09-11' --> 'data\processed_data\DUK\8-K_2025-09-11.md'


2025-11-14 16:35:12,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:12,586 - INFO - Going to convert document batch...
2025-11-14 16:35:12,588 - INFO - Processing document 8-K_2025-10-30


Converted 'data\edgar_documents\DUK\8-K_2025-09-12' --> 'data\processed_data\DUK\8-K_2025-09-12.md'


2025-11-14 16:35:12,737 - INFO - Finished converting document 8-K_2025-10-30 in 0.28 sec.
2025-11-14 16:35:12,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:12,896 - INFO - Going to convert document batch...
2025-11-14 16:35:12,898 - INFO - Processing document 8-K_2025-11-07
2025-11-14 16:35:12,983 - INFO - Finished converting document 8-K_2025-11-07 in 0.16 sec.


Converted 'data\edgar_documents\DUK\8-K_2025-10-30' --> 'data\processed_data\DUK\8-K_2025-10-30.md'


2025-11-14 16:35:13,154 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:35:13,156 - ERROR - Input document DEF-14A_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:35:13,164 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\DUK\8-K_2025-11-07' --> 'data\processed_data\DUK\8-K_2025-11-07.md'
Error processing data\edgar_documents\DUK\DEF-14A_2023-03-23: File format not allowed: data\edgar_documents\DUK\DEF-14A_2023-03-23


2025-11-14 16:35:13,278 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:35:13,279 - ERROR - Input document DEF-14A_2024-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:35:13,288 - INFO - Going to convert document batch...
2025-11-14 16:35:13,403 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:35:13,406 - ERROR - Input document DEF-14A_2025-03-14 with format No

Error processing data\edgar_documents\DUK\DEF-14A_2024-03-22: File format not allowed: data\edgar_documents\DUK\DEF-14A_2024-03-22
Error processing data\edgar_documents\DUK\DEF-14A_2025-03-14: File format not allowed: data\edgar_documents\DUK\DEF-14A_2025-03-14
Processed 106 new files. Errors: 26
Found 83 files to process in data\edgar_documents\EMR


2025-11-14 16:35:13,556 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:35:17,942 - INFO - Going to convert document batch...
2025-11-14 16:35:17,944 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:35:17,946 - INFO - Processing document 10-K_2023-11-13
2025-11-14 16:35:23,099 - INFO - Finished converting document 10-K_2023-11-13 in 9.64 sec.
2025-11-14 16:35:24,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-K_2023-11-13' --> 'data\processed_data\EMR\10-K_2023-11-13.md'


2025-11-14 16:35:27,805 - INFO - Going to convert document batch...
2025-11-14 16:35:27,808 - INFO - Processing document 10-K_2024-11-12
2025-11-14 16:35:32,720 - INFO - Finished converting document 10-K_2024-11-12 in 7.91 sec.
2025-11-14 16:35:34,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-K_2024-11-12' --> 'data\processed_data\EMR\10-K_2024-11-12.md'


2025-11-14 16:35:37,505 - INFO - Going to convert document batch...
2025-11-14 16:35:37,507 - INFO - Processing document 10-K_2025-11-10
2025-11-14 16:35:42,709 - INFO - Finished converting document 10-K_2025-11-10 in 8.50 sec.
2025-11-14 16:35:44,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-K_2025-11-10' --> 'data\processed_data\EMR\10-K_2025-11-10.md'


2025-11-14 16:35:46,351 - INFO - Going to convert document batch...
2025-11-14 16:35:46,354 - INFO - Processing document 10-Q_2023-02-08
2025-11-14 16:35:48,856 - INFO - Finished converting document 10-Q_2023-02-08 in 4.55 sec.
2025-11-14 16:35:49,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2023-02-08' --> 'data\processed_data\EMR\10-Q_2023-02-08.md'


2025-11-14 16:35:51,520 - INFO - Going to convert document batch...
2025-11-14 16:35:51,522 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 16:35:54,429 - INFO - Finished converting document 10-Q_2023-05-03 in 4.59 sec.
2025-11-14 16:35:56,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2023-05-03' --> 'data\processed_data\EMR\10-Q_2023-05-03.md'


2025-11-14 16:35:58,210 - INFO - Going to convert document batch...
2025-11-14 16:35:58,213 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 16:36:01,368 - INFO - Finished converting document 10-Q_2023-08-02 in 5.01 sec.
2025-11-14 16:36:02,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2023-08-02' --> 'data\processed_data\EMR\10-Q_2023-08-02.md'


2025-11-14 16:36:04,761 - INFO - Going to convert document batch...
2025-11-14 16:36:04,763 - INFO - Processing document 10-Q_2024-02-07
2025-11-14 16:36:06,938 - INFO - Finished converting document 10-Q_2024-02-07 in 4.12 sec.
2025-11-14 16:36:08,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2024-02-07' --> 'data\processed_data\EMR\10-Q_2024-02-07.md'


2025-11-14 16:36:09,742 - INFO - Going to convert document batch...
2025-11-14 16:36:09,744 - INFO - Processing document 10-Q_2024-05-08
2025-11-14 16:36:12,652 - INFO - Finished converting document 10-Q_2024-05-08 in 4.45 sec.
2025-11-14 16:36:13,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2024-05-08' --> 'data\processed_data\EMR\10-Q_2024-05-08.md'


2025-11-14 16:36:15,905 - INFO - Going to convert document batch...
2025-11-14 16:36:15,907 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:36:18,606 - INFO - Finished converting document 10-Q_2024-08-07 in 4.72 sec.
2025-11-14 16:36:20,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2024-08-07' --> 'data\processed_data\EMR\10-Q_2024-08-07.md'


2025-11-14 16:36:21,499 - INFO - Going to convert document batch...
2025-11-14 16:36:21,501 - INFO - Processing document 10-Q_2025-02-05
2025-11-14 16:36:23,434 - INFO - Finished converting document 10-Q_2025-02-05 in 3.45 sec.
2025-11-14 16:36:24,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2025-02-05' --> 'data\processed_data\EMR\10-Q_2025-02-05.md'


2025-11-14 16:36:25,714 - INFO - Going to convert document batch...
2025-11-14 16:36:25,717 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 16:36:28,218 - INFO - Finished converting document 10-Q_2025-05-07 in 3.88 sec.
2025-11-14 16:36:29,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\10-Q_2025-05-07' --> 'data\processed_data\EMR\10-Q_2025-05-07.md'


2025-11-14 16:36:31,806 - INFO - Going to convert document batch...
2025-11-14 16:36:31,809 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 16:36:34,440 - INFO - Finished converting document 10-Q_2025-08-06 in 4.78 sec.
2025-11-14 16:36:35,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:35,597 - INFO - Going to convert document batch...
2025-11-14 16:36:35,599 - INFO - Processing document 4_2023-02-09
2025-11-14 16:36:35,673 - INFO - Finished converting document 4_2023-02-09 in 0.14 sec.


Converted 'data\edgar_documents\EMR\10-Q_2025-08-06' --> 'data\processed_data\EMR\10-Q_2025-08-06.md'


2025-11-14 16:36:35,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:35,850 - INFO - Going to convert document batch...
2025-11-14 16:36:35,853 - INFO - Processing document 4_2023-03-06


Converted 'data\edgar_documents\EMR\4_2023-02-09' --> 'data\processed_data\EMR\4_2023-02-09.md'


2025-11-14 16:36:36,057 - INFO - Finished converting document 4_2023-03-06 in 0.30 sec.
2025-11-14 16:36:36,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:36,208 - INFO - Going to convert document batch...
2025-11-14 16:36:36,210 - INFO - Processing document 4_2023-05-03
2025-11-14 16:36:36,321 - INFO - Finished converting document 4_2023-05-03 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2023-03-06' --> 'data\processed_data\EMR\4_2023-03-06.md'


2025-11-14 16:36:36,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:36,503 - INFO - Going to convert document batch...
2025-11-14 16:36:36,506 - INFO - Processing document 4_2023-05-04
2025-11-14 16:36:36,589 - INFO - Finished converting document 4_2023-05-04 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2023-05-03' --> 'data\processed_data\EMR\4_2023-05-03.md'


2025-11-14 16:36:36,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:36,779 - INFO - Going to convert document batch...
2025-11-14 16:36:36,782 - INFO - Processing document 4_2023-06-29
2025-11-14 16:36:36,869 - INFO - Finished converting document 4_2023-06-29 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2023-05-04' --> 'data\processed_data\EMR\4_2023-05-04.md'


2025-11-14 16:36:36,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:37,058 - INFO - Going to convert document batch...
2025-11-14 16:36:37,060 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\EMR\4_2023-06-29' --> 'data\processed_data\EMR\4_2023-06-29.md'


2025-11-14 16:36:37,225 - INFO - Finished converting document 4_2023-08-07 in 0.25 sec.
2025-11-14 16:36:37,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:37,430 - INFO - Going to convert document batch...
2025-11-14 16:36:37,433 - INFO - Processing document 4_2023-09-07


Converted 'data\edgar_documents\EMR\4_2023-08-07' --> 'data\processed_data\EMR\4_2023-08-07.md'


2025-11-14 16:36:37,531 - INFO - Finished converting document 4_2023-09-07 in 0.19 sec.
2025-11-14 16:36:37,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:37,695 - INFO - Going to convert document batch...
2025-11-14 16:36:37,697 - INFO - Processing document 4_2023-09-08
2025-11-14 16:36:37,807 - INFO - Finished converting document 4_2023-09-08 in 0.19 sec.


Converted 'data\edgar_documents\EMR\4_2023-09-07' --> 'data\processed_data\EMR\4_2023-09-07.md'


2025-11-14 16:36:37,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:38,015 - INFO - Going to convert document batch...
2025-11-14 16:36:38,017 - INFO - Processing document 4_2023-10-11
2025-11-14 16:36:38,088 - INFO - Finished converting document 4_2023-10-11 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2023-09-08' --> 'data\processed_data\EMR\4_2023-09-08.md'


2025-11-14 16:36:38,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:38,246 - INFO - Going to convert document batch...
2025-11-14 16:36:38,247 - INFO - Processing document 4_2023-11-08
2025-11-14 16:36:38,327 - INFO - Finished converting document 4_2023-11-08 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2023-10-11' --> 'data\processed_data\EMR\4_2023-10-11.md'


2025-11-14 16:36:38,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:38,509 - INFO - Going to convert document batch...
2025-11-14 16:36:38,511 - INFO - Processing document 4_2023-11-13
2025-11-14 16:36:38,588 - INFO - Finished converting document 4_2023-11-13 in 0.14 sec.


Converted 'data\edgar_documents\EMR\4_2023-11-08' --> 'data\processed_data\EMR\4_2023-11-08.md'


2025-11-14 16:36:38,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:38,717 - INFO - Going to convert document batch...
2025-11-14 16:36:38,720 - INFO - Processing document 4_2023-11-14
2025-11-14 16:36:38,797 - INFO - Finished converting document 4_2023-11-14 in 0.12 sec.


Converted 'data\edgar_documents\EMR\4_2023-11-13' --> 'data\processed_data\EMR\4_2023-11-13.md'


2025-11-14 16:36:38,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:38,949 - INFO - Going to convert document batch...
2025-11-14 16:36:38,951 - INFO - Processing document 4_2023-11-20
2025-11-14 16:36:39,048 - INFO - Finished converting document 4_2023-11-20 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2023-11-14' --> 'data\processed_data\EMR\4_2023-11-14.md'


2025-11-14 16:36:39,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:39,231 - INFO - Going to convert document batch...
2025-11-14 16:36:39,234 - INFO - Processing document 4_2023-12-18
2025-11-14 16:36:39,325 - INFO - Finished converting document 4_2023-12-18 in 0.19 sec.


Converted 'data\edgar_documents\EMR\4_2023-11-20' --> 'data\processed_data\EMR\4_2023-11-20.md'


2025-11-14 16:36:39,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:39,482 - INFO - Going to convert document batch...
2025-11-14 16:36:39,485 - INFO - Processing document 4_2024-01-03
2025-11-14 16:36:39,589 - INFO - Finished converting document 4_2024-01-03 in 0.19 sec.


Converted 'data\edgar_documents\EMR\4_2023-12-18' --> 'data\processed_data\EMR\4_2023-12-18.md'


2025-11-14 16:36:39,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:39,787 - INFO - Going to convert document batch...
2025-11-14 16:36:39,791 - INFO - Processing document 4_2024-02-08
2025-11-14 16:36:39,867 - INFO - Finished converting document 4_2024-02-08 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-01-03' --> 'data\processed_data\EMR\4_2024-01-03.md'


2025-11-14 16:36:39,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:39,992 - INFO - Going to convert document batch...
2025-11-14 16:36:39,994 - INFO - Processing document 4_2024-02-13
2025-11-14 16:36:40,088 - INFO - Finished converting document 4_2024-02-13 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2024-02-08' --> 'data\processed_data\EMR\4_2024-02-08.md'


2025-11-14 16:36:40,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:40,226 - INFO - Going to convert document batch...
2025-11-14 16:36:40,227 - INFO - Processing document 4_2024-02-16
2025-11-14 16:36:40,309 - INFO - Finished converting document 4_2024-02-16 in 0.14 sec.


Converted 'data\edgar_documents\EMR\4_2024-02-13' --> 'data\processed_data\EMR\4_2024-02-13.md'


2025-11-14 16:36:40,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:40,541 - INFO - Going to convert document batch...
2025-11-14 16:36:40,544 - INFO - Processing document 4_2024-03-05


Converted 'data\edgar_documents\EMR\4_2024-02-16' --> 'data\processed_data\EMR\4_2024-02-16.md'


2025-11-14 16:36:40,626 - INFO - Finished converting document 4_2024-03-05 in 0.23 sec.
2025-11-14 16:36:40,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:40,811 - INFO - Going to convert document batch...
2025-11-14 16:36:40,813 - INFO - Processing document 4_2024-06-28


Converted 'data\edgar_documents\EMR\4_2024-03-05' --> 'data\processed_data\EMR\4_2024-03-05.md'


2025-11-14 16:36:40,945 - INFO - Finished converting document 4_2024-06-28 in 0.23 sec.
2025-11-14 16:36:41,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:41,260 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\EMR\4_2024-06-28' --> 'data\processed_data\EMR\4_2024-06-28.md'


2025-11-14 16:36:41,263 - INFO - Processing document 4_2024-08-05
2025-11-14 16:36:41,341 - INFO - Finished converting document 4_2024-08-05 in 0.27 sec.
2025-11-14 16:36:41,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:41,503 - INFO - Going to convert document batch...
2025-11-14 16:36:41,504 - INFO - Processing document 4_2024-10-09
2025-11-14 16:36:41,587 - INFO - Finished converting document 4_2024-10-09 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2024-08-05' --> 'data\processed_data\EMR\4_2024-08-05.md'


2025-11-14 16:36:41,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:41,740 - INFO - Going to convert document batch...
2025-11-14 16:36:41,742 - INFO - Processing document 4_2024-11-06
2025-11-14 16:36:41,836 - INFO - Finished converting document 4_2024-11-06 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-10-09' --> 'data\processed_data\EMR\4_2024-10-09.md'


2025-11-14 16:36:41,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:42,007 - INFO - Going to convert document batch...
2025-11-14 16:36:42,009 - INFO - Processing document 4_2024-11-08
2025-11-14 16:36:42,095 - INFO - Finished converting document 4_2024-11-08 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-11-06' --> 'data\processed_data\EMR\4_2024-11-06.md'


2025-11-14 16:36:42,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:42,246 - INFO - Going to convert document batch...
2025-11-14 16:36:42,248 - INFO - Processing document 4_2024-11-14
2025-11-14 16:36:42,334 - INFO - Finished converting document 4_2024-11-14 in 0.12 sec.


Converted 'data\edgar_documents\EMR\4_2024-11-08' --> 'data\processed_data\EMR\4_2024-11-08.md'


2025-11-14 16:36:42,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:42,527 - INFO - Going to convert document batch...
2025-11-14 16:36:42,528 - INFO - Processing document 4_2024-11-15
2025-11-14 16:36:42,617 - INFO - Finished converting document 4_2024-11-15 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-11-14' --> 'data\processed_data\EMR\4_2024-11-14.md'


2025-11-14 16:36:42,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:42,757 - INFO - Going to convert document batch...
2025-11-14 16:36:42,758 - INFO - Processing document 4_2024-11-25
2025-11-14 16:36:42,871 - INFO - Finished converting document 4_2024-11-25 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-11-15' --> 'data\processed_data\EMR\4_2024-11-15.md'


2025-11-14 16:36:42,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:43,012 - INFO - Going to convert document batch...
2025-11-14 16:36:43,014 - INFO - Processing document 4_2024-12-19
2025-11-14 16:36:43,122 - INFO - Finished converting document 4_2024-12-19 in 0.17 sec.


Converted 'data\edgar_documents\EMR\4_2024-11-25' --> 'data\processed_data\EMR\4_2024-11-25.md'


2025-11-14 16:36:43,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:43,286 - INFO - Going to convert document batch...
2025-11-14 16:36:43,288 - INFO - Processing document 4_2025-01-06
2025-11-14 16:36:43,348 - INFO - Finished converting document 4_2025-01-06 in 0.12 sec.


Converted 'data\edgar_documents\EMR\4_2024-12-19' --> 'data\processed_data\EMR\4_2024-12-19.md'


2025-11-14 16:36:43,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:43,482 - INFO - Going to convert document batch...
2025-11-14 16:36:43,483 - INFO - Processing document 4_2025-02-06
2025-11-14 16:36:43,546 - INFO - Finished converting document 4_2025-02-06 in 0.11 sec.


Converted 'data\edgar_documents\EMR\4_2025-01-06' --> 'data\processed_data\EMR\4_2025-01-06.md'
Converted 'data\edgar_documents\EMR\4_2025-02-06' --> 'data\processed_data\EMR\4_2025-02-06.md'


2025-11-14 16:36:43,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:43,688 - INFO - Going to convert document batch...
2025-11-14 16:36:43,691 - INFO - Processing document 4_2025-02-12
2025-11-14 16:36:43,757 - INFO - Finished converting document 4_2025-02-12 in 0.14 sec.
2025-11-14 16:36:43,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:43,889 - INFO - Going to convert document batch...
2025-11-14 16:36:43,890 - INFO - Processing document 4_2025-02-13
2025-11-14 16:36:43,956 - INFO - Finished converting document 4_2025-02-13 in 0.14 sec.


Converted 'data\edgar_documents\EMR\4_2025-02-12' --> 'data\processed_data\EMR\4_2025-02-12.md'


2025-11-14 16:36:44,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:44,068 - INFO - Going to convert document batch...
2025-11-14 16:36:44,070 - INFO - Processing document 4_2025-02-14
2025-11-14 16:36:44,135 - INFO - Finished converting document 4_2025-02-14 in 0.09 sec.


Converted 'data\edgar_documents\EMR\4_2025-02-13' --> 'data\processed_data\EMR\4_2025-02-13.md'
Converted 'data\edgar_documents\EMR\4_2025-02-14' --> 'data\processed_data\EMR\4_2025-02-14.md'


2025-11-14 16:36:44,279 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:36:44,280 - ERROR - Input document 4_2025-02-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:36:44,283 - INFO - Going to convert document batch...
2025-11-14 16:36:44,312 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:36:44,313 - ERROR - Input document 4_2025-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\EMR\4_2025-02-25: File format not allowed: data\edgar_documents\EMR\4_2025-02-25
Error processing data\edgar_documents\EMR\4_2025-02-27: File format not allowed: data\edgar_documents\EMR\4_2025-02-27


2025-11-14 16:36:44,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:44,671 - INFO - Going to convert document batch...
2025-11-14 16:36:44,673 - INFO - Processing document 4_2025-05-13
2025-11-14 16:36:44,738 - INFO - Finished converting document 4_2025-05-13 in 0.14 sec.


Converted 'data\edgar_documents\EMR\4_2025-05-09' --> 'data\processed_data\EMR\4_2025-05-09.md'


2025-11-14 16:36:44,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:44,884 - INFO - Going to convert document batch...
2025-11-14 16:36:44,885 - INFO - Processing document 4_2025-11-05


Converted 'data\edgar_documents\EMR\4_2025-05-13' --> 'data\processed_data\EMR\4_2025-05-13.md'


2025-11-14 16:36:45,486 - INFO - Finished converting document 4_2025-11-05 in 0.69 sec.
2025-11-14 16:36:45,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:45,646 - INFO - Going to convert document batch...
2025-11-14 16:36:45,647 - INFO - Processing document 4_2025-11-06
2025-11-14 16:36:45,713 - INFO - Finished converting document 4_2025-11-06 in 0.16 sec.


Converted 'data\edgar_documents\EMR\4_2025-11-05' --> 'data\processed_data\EMR\4_2025-11-05.md'


2025-11-14 16:36:45,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:45,826 - INFO - Going to convert document batch...
2025-11-14 16:36:45,828 - INFO - Processing document 4_2025-11-10
2025-11-14 16:36:45,899 - INFO - Finished converting document 4_2025-11-10 in 0.11 sec.


Converted 'data\edgar_documents\EMR\4_2025-11-06' --> 'data\processed_data\EMR\4_2025-11-06.md'
Converted 'data\edgar_documents\EMR\4_2025-11-10' --> 'data\processed_data\EMR\4_2025-11-10.md'


2025-11-14 16:36:46,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:46,068 - INFO - Going to convert document batch...
2025-11-14 16:36:46,071 - INFO - Processing document 8-K_2023-02-08
2025-11-14 16:36:46,135 - INFO - Finished converting document 8-K_2023-02-08 in 0.17 sec.
2025-11-14 16:36:46,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:46,303 - INFO - Going to convert document batch...
2025-11-14 16:36:46,305 - INFO - Processing document 8-K_2023-02-10
2025-11-14 16:36:46,395 - INFO - Finished converting document 8-K_2023-02-10 in 0.20 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-02-08' --> 'data\processed_data\EMR\8-K_2023-02-08.md'


2025-11-14 16:36:46,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:46,531 - INFO - Going to convert document batch...
2025-11-14 16:36:46,532 - INFO - Processing document 8-K_2023-02-21
2025-11-14 16:36:46,620 - INFO - Finished converting document 8-K_2023-02-21 in 0.19 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-02-10' --> 'data\processed_data\EMR\8-K_2023-02-10.md'


2025-11-14 16:36:46,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:46,830 - INFO - Going to convert document batch...
2025-11-14 16:36:46,833 - INFO - Processing document 8-K_2023-04-06
2025-11-14 16:36:46,892 - INFO - Finished converting document 8-K_2023-04-06 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-02-21' --> 'data\processed_data\EMR\8-K_2023-02-21.md'


2025-11-14 16:36:46,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:47,044 - INFO - Going to convert document batch...
2025-11-14 16:36:47,045 - INFO - Processing document 8-K_2023-04-12


Converted 'data\edgar_documents\EMR\8-K_2023-04-06' --> 'data\processed_data\EMR\8-K_2023-04-06.md'


2025-11-14 16:36:47,190 - INFO - Finished converting document 8-K_2023-04-12 in 0.27 sec.
2025-11-14 16:36:47,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:47,435 - INFO - Going to convert document batch...
2025-11-14 16:36:47,437 - INFO - Processing document 8-K_2023-05-02
2025-11-14 16:36:47,505 - INFO - Finished converting document 8-K_2023-05-02 in 0.17 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-04-12' --> 'data\processed_data\EMR\8-K_2023-04-12.md'


2025-11-14 16:36:47,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:47,604 - INFO - Going to convert document batch...
2025-11-14 16:36:47,607 - INFO - Processing document 8-K_2023-05-03
2025-11-14 16:36:47,711 - INFO - Finished converting document 8-K_2023-05-03 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-05-02' --> 'data\processed_data\EMR\8-K_2023-05-02.md'


2025-11-14 16:36:47,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:47,854 - INFO - Going to convert document batch...
2025-11-14 16:36:47,856 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:36:47,932 - INFO - Finished converting document 8-K_2023-06-02 in 0.17 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-05-03' --> 'data\processed_data\EMR\8-K_2023-05-03.md'


2025-11-14 16:36:48,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:48,102 - INFO - Going to convert document batch...
2025-11-14 16:36:48,103 - INFO - Processing document 8-K_2023-08-02


Converted 'data\edgar_documents\EMR\8-K_2023-06-02' --> 'data\processed_data\EMR\8-K_2023-06-02.md'


2025-11-14 16:36:48,177 - INFO - Finished converting document 8-K_2023-08-02 in 0.19 sec.
2025-11-14 16:36:48,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:48,320 - INFO - Going to convert document batch...
2025-11-14 16:36:48,322 - INFO - Processing document 8-K_2023-10-11
2025-11-14 16:36:48,403 - INFO - Finished converting document 8-K_2023-10-11 in 0.19 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-08-02' --> 'data\processed_data\EMR\8-K_2023-08-02.md'


2025-11-14 16:36:48,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:48,574 - INFO - Going to convert document batch...
2025-11-14 16:36:48,576 - INFO - Processing document 8-K_2023-11-07
2025-11-14 16:36:48,634 - INFO - Finished converting document 8-K_2023-11-07 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-10-11' --> 'data\processed_data\EMR\8-K_2023-10-11.md'


2025-11-14 16:36:48,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:48,760 - INFO - Going to convert document batch...
2025-11-14 16:36:48,763 - INFO - Processing document 8-K_2023-11-30
2025-11-14 16:36:48,830 - INFO - Finished converting document 8-K_2023-11-30 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2023-11-07' --> 'data\processed_data\EMR\8-K_2023-11-07.md'
Converted 'data\edgar_documents\EMR\8-K_2023-11-30' --> 'data\processed_data\EMR\8-K_2023-11-30.md'


2025-11-14 16:36:48,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:48,974 - INFO - Going to convert document batch...
2025-11-14 16:36:48,977 - INFO - Processing document 8-K_2024-02-07
2025-11-14 16:36:49,055 - INFO - Finished converting document 8-K_2024-02-07 in 0.17 sec.
2025-11-14 16:36:49,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:49,189 - INFO - Going to convert document batch...
2025-11-14 16:36:49,190 - INFO - Processing document 8-K_2024-02-09


Converted 'data\edgar_documents\EMR\8-K_2024-02-07' --> 'data\processed_data\EMR\8-K_2024-02-07.md'


2025-11-14 16:36:49,286 - INFO - Finished converting document 8-K_2024-02-09 in 0.19 sec.
2025-11-14 16:36:49,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:49,438 - INFO - Going to convert document batch...
2025-11-14 16:36:49,440 - INFO - Processing document 8-K_2024-05-08
2025-11-14 16:36:49,507 - INFO - Finished converting document 8-K_2024-05-08 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2024-02-09' --> 'data\processed_data\EMR\8-K_2024-02-09.md'


2025-11-14 16:36:49,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:49,656 - INFO - Going to convert document batch...
2025-11-14 16:36:49,657 - INFO - Processing document 8-K_2024-06-06
2025-11-14 16:36:49,754 - INFO - Finished converting document 8-K_2024-06-06 in 0.19 sec.


Converted 'data\edgar_documents\EMR\8-K_2024-05-08' --> 'data\processed_data\EMR\8-K_2024-05-08.md'


2025-11-14 16:36:49,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:49,919 - INFO - Going to convert document batch...
2025-11-14 16:36:49,921 - INFO - Processing document 8-K_2024-08-07
2025-11-14 16:36:49,993 - INFO - Finished converting document 8-K_2024-08-07 in 0.16 sec.


Converted 'data\edgar_documents\EMR\8-K_2024-06-06' --> 'data\processed_data\EMR\8-K_2024-06-06.md'


2025-11-14 16:36:50,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:50,134 - INFO - Going to convert document batch...
2025-11-14 16:36:50,135 - INFO - Processing document 8-K_2024-11-05


Converted 'data\edgar_documents\EMR\8-K_2024-08-07' --> 'data\processed_data\EMR\8-K_2024-08-07.md'


2025-11-14 16:36:50,266 - INFO - Finished converting document 8-K_2024-11-05 in 0.22 sec.
2025-11-14 16:36:50,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:50,481 - INFO - Going to convert document batch...
2025-11-14 16:36:50,483 - INFO - Processing document 8-K_2025-01-27


Converted 'data\edgar_documents\EMR\8-K_2024-11-05' --> 'data\processed_data\EMR\8-K_2024-11-05.md'


2025-11-14 16:36:50,613 - INFO - Finished converting document 8-K_2025-01-27 in 0.25 sec.
2025-11-14 16:36:50,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:50,966 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\EMR\8-K_2025-01-27' --> 'data\processed_data\EMR\8-K_2025-01-27.md'


2025-11-14 16:36:50,968 - INFO - Processing document 8-K_2025-02-05
2025-11-14 16:36:51,046 - INFO - Finished converting document 8-K_2025-02-05 in 0.30 sec.
2025-11-14 16:36:51,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:51,216 - INFO - Going to convert document batch...
2025-11-14 16:36:51,218 - INFO - Processing document 8-K_2025-02-07


Converted 'data\edgar_documents\EMR\8-K_2025-02-05' --> 'data\processed_data\EMR\8-K_2025-02-05.md'


2025-11-14 16:36:51,366 - INFO - Finished converting document 8-K_2025-02-07 in 0.23 sec.
2025-11-14 16:36:51,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:51,489 - INFO - Going to convert document batch...
2025-11-14 16:36:51,491 - INFO - Processing document 8-K_2025-02-14
2025-11-14 16:36:51,583 - INFO - Finished converting document 8-K_2025-02-14 in 0.14 sec.


Converted 'data\edgar_documents\EMR\8-K_2025-02-07' --> 'data\processed_data\EMR\8-K_2025-02-07.md'


2025-11-14 16:36:51,687 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:36:51,689 - ERROR - Input document 8-K_2025-02-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:36:51,691 - INFO - Going to convert document batch...
2025-11-14 16:36:51,715 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:36:51,717 - ERROR - Input document 8-K_2025-03-04 with format None does 

Converted 'data\edgar_documents\EMR\8-K_2025-02-14' --> 'data\processed_data\EMR\8-K_2025-02-14.md'
Error processing data\edgar_documents\EMR\8-K_2025-02-28: File format not allowed: data\edgar_documents\EMR\8-K_2025-02-28
Error processing data\edgar_documents\EMR\8-K_2025-03-04: File format not allowed: data\edgar_documents\EMR\8-K_2025-03-04
Error processing data\edgar_documents\EMR\8-K_2025-03-10: File format not allowed: data\edgar_documents\EMR\8-K_2025-03-10


2025-11-14 16:36:51,832 - INFO - Processing document 8-K_2025-03-12
2025-11-14 16:36:51,904 - INFO - Finished converting document 8-K_2025-03-12 in 0.14 sec.
2025-11-14 16:36:51,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:52,031 - INFO - Going to convert document batch...
2025-11-14 16:36:52,034 - INFO - Processing document 8-K_2025-05-07
2025-11-14 16:36:52,121 - INFO - Finished converting document 8-K_2025-05-07 in 0.17 sec.


Converted 'data\edgar_documents\EMR\8-K_2025-03-12' --> 'data\processed_data\EMR\8-K_2025-03-12.md'


2025-11-14 16:36:52,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:52,266 - INFO - Going to convert document batch...
2025-11-14 16:36:52,267 - INFO - Processing document 8-K_2025-08-06


Converted 'data\edgar_documents\EMR\8-K_2025-05-07' --> 'data\processed_data\EMR\8-K_2025-05-07.md'


2025-11-14 16:36:52,346 - INFO - Finished converting document 8-K_2025-08-06 in 0.19 sec.
2025-11-14 16:36:52,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:36:52,494 - INFO - Going to convert document batch...
2025-11-14 16:36:52,496 - INFO - Processing document 8-K_2025-11-05
2025-11-14 16:36:52,570 - INFO - Finished converting document 8-K_2025-11-05 in 0.17 sec.


Converted 'data\edgar_documents\EMR\8-K_2025-08-06' --> 'data\processed_data\EMR\8-K_2025-08-06.md'


2025-11-14 16:36:52,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\8-K_2025-11-05' --> 'data\processed_data\EMR\8-K_2025-11-05.md'


2025-11-14 16:36:55,247 - INFO - Going to convert document batch...
2025-11-14 16:36:55,251 - INFO - Processing document DEF-14A_2023-12-08
2025-11-14 16:36:59,206 - INFO - Finished converting document DEF-14A_2023-12-08 in 6.59 sec.
2025-11-14 16:37:01,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\EMR\DEF-14A_2023-12-08' --> 'data\processed_data\EMR\DEF-14A_2023-12-08.md'


2025-11-14 16:37:03,564 - INFO - Going to convert document batch...
2025-11-14 16:37:03,565 - INFO - Processing document DEF-14A_2024-12-13
2025-11-14 16:37:11,147 - INFO - Finished converting document DEF-14A_2024-12-13 in 9.41 sec.


Converted 'data\edgar_documents\EMR\DEF-14A_2024-12-13' --> 'data\processed_data\EMR\DEF-14A_2024-12-13.md'
Processed 78 new files. Errors: 5
Found 103 files to process in data\edgar_documents\FDX


2025-11-14 16:37:14,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:37:20,378 - INFO - Going to convert document batch...
2025-11-14 16:37:20,380 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:37:20,382 - INFO - Processing document 10-K_2023-07-17
2025-11-14 16:37:34,746 - INFO - Finished converting document 10-K_2023-07-17 in 20.92 sec.
2025-11-14 16:37:37,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-K_2023-07-17' --> 'data\processed_data\FDX\10-K_2023-07-17.md'


2025-11-14 16:37:42,893 - INFO - Going to convert document batch...
2025-11-14 16:37:42,895 - INFO - Processing document 10-K_2024-07-15
2025-11-14 16:37:56,231 - INFO - Finished converting document 10-K_2024-07-15 in 19.33 sec.
2025-11-14 16:37:58,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-K_2024-07-15' --> 'data\processed_data\FDX\10-K_2024-07-15.md'


2025-11-14 16:38:01,085 - INFO - Going to convert document batch...
2025-11-14 16:38:01,087 - INFO - Processing document 10-K_2025-07-21
2025-11-14 16:38:08,113 - INFO - Finished converting document 10-K_2025-07-21 in 9.66 sec.
2025-11-14 16:38:10,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-K_2025-07-21' --> 'data\processed_data\FDX\10-K_2025-07-21.md'


2025-11-14 16:38:15,178 - INFO - Going to convert document batch...
2025-11-14 16:38:15,179 - INFO - Processing document 10-Q_2023-03-16
2025-11-14 16:38:19,229 - INFO - Finished converting document 10-Q_2023-03-16 in 8.58 sec.
2025-11-14 16:38:20,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2023-03-16' --> 'data\processed_data\FDX\10-Q_2023-03-16.md'


2025-11-14 16:38:21,888 - INFO - Going to convert document batch...
2025-11-14 16:38:21,890 - INFO - Processing document 10-Q_2023-09-20
2025-11-14 16:38:25,098 - INFO - Finished converting document 10-Q_2023-09-20 in 5.14 sec.
2025-11-14 16:38:25,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2023-09-20' --> 'data\processed_data\FDX\10-Q_2023-09-20.md'


2025-11-14 16:38:28,219 - INFO - Going to convert document batch...
2025-11-14 16:38:28,221 - INFO - Processing document 10-Q_2023-12-19
2025-11-14 16:38:31,735 - INFO - Finished converting document 10-Q_2023-12-19 in 6.17 sec.
2025-11-14 16:38:33,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2023-12-19' --> 'data\processed_data\FDX\10-Q_2023-12-19.md'


2025-11-14 16:38:35,324 - INFO - Going to convert document batch...
2025-11-14 16:38:35,325 - INFO - Processing document 10-Q_2024-03-21
2025-11-14 16:38:39,233 - INFO - Finished converting document 10-Q_2024-03-21 in 6.20 sec.
2025-11-14 16:38:40,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2024-03-21' --> 'data\processed_data\FDX\10-Q_2024-03-21.md'


2025-11-14 16:38:41,600 - INFO - Going to convert document batch...
2025-11-14 16:38:41,601 - INFO - Processing document 10-Q_2024-09-19
2025-11-14 16:38:43,855 - INFO - Finished converting document 10-Q_2024-09-19 in 3.81 sec.
2025-11-14 16:38:44,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2024-09-19' --> 'data\processed_data\FDX\10-Q_2024-09-19.md'


2025-11-14 16:38:47,913 - INFO - Going to convert document batch...
2025-11-14 16:38:47,915 - INFO - Processing document 10-Q_2024-12-19
2025-11-14 16:38:51,132 - INFO - Finished converting document 10-Q_2024-12-19 in 6.77 sec.
2025-11-14 16:38:51,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2024-12-19' --> 'data\processed_data\FDX\10-Q_2024-12-19.md'


2025-11-14 16:38:54,751 - INFO - Going to convert document batch...
2025-11-14 16:38:54,752 - INFO - Processing document 10-Q_2025-03-20
2025-11-14 16:38:57,989 - INFO - Finished converting document 10-Q_2025-03-20 in 6.23 sec.
2025-11-14 16:38:58,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\10-Q_2025-03-20' --> 'data\processed_data\FDX\10-Q_2025-03-20.md'


2025-11-14 16:38:59,853 - INFO - Going to convert document batch...
2025-11-14 16:38:59,854 - INFO - Processing document 10-Q_2025-09-18
2025-11-14 16:39:02,266 - INFO - Finished converting document 10-Q_2025-09-18 in 3.59 sec.
2025-11-14 16:39:03,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:03,115 - INFO - Going to convert document batch...
2025-11-14 16:39:03,116 - INFO - Processing document 4_2023-01-03
2025-11-14 16:39:03,206 - INFO - Finished converting document 4_2023-01-03 in 0.16 sec.


Converted 'data\edgar_documents\FDX\10-Q_2025-09-18' --> 'data\processed_data\FDX\10-Q_2025-09-18.md'


2025-11-14 16:39:03,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:03,316 - INFO - Going to convert document batch...
2025-11-14 16:39:03,318 - INFO - Processing document 4_2023-01-13
2025-11-14 16:39:03,386 - INFO - Finished converting document 4_2023-01-13 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2023-01-03' --> 'data\processed_data\FDX\4_2023-01-03.md'
Converted 'data\edgar_documents\FDX\4_2023-01-13' --> 'data\processed_data\FDX\4_2023-01-13.md'


2025-11-14 16:39:03,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:03,546 - INFO - Going to convert document batch...
2025-11-14 16:39:03,547 - INFO - Processing document 4_2023-04-06
2025-11-14 16:39:03,639 - INFO - Finished converting document 4_2023-04-06 in 0.19 sec.
2025-11-14 16:39:03,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:03,817 - INFO - Going to convert document batch...
2025-11-14 16:39:03,818 - INFO - Processing document 4_2023-04-10
2025-11-14 16:39:03,887 - INFO - Finished converting document 4_2023-04-10 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2023-04-06' --> 'data\processed_data\FDX\4_2023-04-06.md'


2025-11-14 16:39:04,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:04,065 - INFO - Going to convert document batch...
2025-11-14 16:39:04,066 - INFO - Processing document 4_2023-04-12
2025-11-14 16:39:04,148 - INFO - Finished converting document 4_2023-04-12 in 0.17 sec.


Converted 'data\edgar_documents\FDX\4_2023-04-10' --> 'data\processed_data\FDX\4_2023-04-10.md'


2025-11-14 16:39:04,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:04,308 - INFO - Going to convert document batch...
2025-11-14 16:39:04,309 - INFO - Processing document 4_2023-04-13
2025-11-14 16:39:04,369 - INFO - Finished converting document 4_2023-04-13 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2023-04-12' --> 'data\processed_data\FDX\4_2023-04-12.md'


2025-11-14 16:39:04,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:04,490 - INFO - Going to convert document batch...
2025-11-14 16:39:04,491 - INFO - Processing document 4_2023-06-23
2025-11-14 16:39:04,553 - INFO - Finished converting document 4_2023-06-23 in 0.11 sec.


Converted 'data\edgar_documents\FDX\4_2023-04-13' --> 'data\processed_data\FDX\4_2023-04-13.md'


2025-11-14 16:39:04,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:04,711 - INFO - Going to convert document batch...
2025-11-14 16:39:04,713 - INFO - Processing document 4_2023-06-27
2025-11-14 16:39:04,799 - INFO - Finished converting document 4_2023-06-27 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2023-06-23' --> 'data\processed_data\FDX\4_2023-06-23.md'


2025-11-14 16:39:04,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:04,936 - INFO - Going to convert document batch...
2025-11-14 16:39:04,937 - INFO - Processing document 4_2023-06-28
2025-11-14 16:39:05,013 - INFO - Finished converting document 4_2023-06-28 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2023-06-27' --> 'data\processed_data\FDX\4_2023-06-27.md'


2025-11-14 16:39:05,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:05,189 - INFO - Going to convert document batch...
2025-11-14 16:39:05,190 - INFO - Processing document 4_2023-07-20
2025-11-14 16:39:05,259 - INFO - Finished converting document 4_2023-07-20 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2023-06-28' --> 'data\processed_data\FDX\4_2023-06-28.md'


2025-11-14 16:39:05,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:05,415 - INFO - Going to convert document batch...
2025-11-14 16:39:05,416 - INFO - Processing document 4_2023-07-21
2025-11-14 16:39:05,475 - INFO - Finished converting document 4_2023-07-21 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2023-07-20' --> 'data\processed_data\FDX\4_2023-07-20.md'
Converted 'data\edgar_documents\FDX\4_2023-07-21' --> 'data\processed_data\FDX\4_2023-07-21.md'


2025-11-14 16:39:05,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:05,583 - INFO - Going to convert document batch...
2025-11-14 16:39:05,585 - INFO - Processing document 4_2023-09-25
2025-11-14 16:39:05,640 - INFO - Finished converting document 4_2023-09-25 in 0.11 sec.
2025-11-14 16:39:05,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:05,772 - INFO - Going to convert document batch...
2025-11-14 16:39:05,774 - INFO - Processing document 4_2023-09-29
2025-11-14 16:39:05,816 - INFO - Finished converting document 4_2023-09-29 in 0.11 sec.
2025-11-14 16:39:05,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\4_2023-09-25' --> 'data\processed_data\FDX\4_2023-09-25.md'
Converted 'data\edgar_documents\FDX\4_2023-09-29' --> 'data\processed_data\FDX\4_2023-09-29.md'


2025-11-14 16:39:05,925 - INFO - Going to convert document batch...
2025-11-14 16:39:05,926 - INFO - Processing document 4_2023-10-06
2025-11-14 16:39:06,007 - INFO - Finished converting document 4_2023-10-06 in 0.12 sec.
2025-11-14 16:39:06,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:06,172 - INFO - Going to convert document batch...
2025-11-14 16:39:06,174 - INFO - Processing document 4_2023-12-26
2025-11-14 16:39:06,234 - INFO - Finished converting document 4_2023-12-26 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2023-10-06' --> 'data\processed_data\FDX\4_2023-10-06.md'


2025-11-14 16:39:06,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:06,379 - INFO - Going to convert document batch...
2025-11-14 16:39:06,381 - INFO - Processing document 4_2023-12-27
2025-11-14 16:39:06,455 - INFO - Finished converting document 4_2023-12-27 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2023-12-26' --> 'data\processed_data\FDX\4_2023-12-26.md'


2025-11-14 16:39:06,556 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:06,577 - INFO - Going to convert document batch...
2025-11-14 16:39:06,579 - INFO - Processing document 4_2023-12-28
2025-11-14 16:39:06,644 - INFO - Finished converting document 4_2023-12-28 in 0.11 sec.
2025-11-14 16:39:06,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\4_2023-12-27' --> 'data\processed_data\FDX\4_2023-12-27.md'
Converted 'data\edgar_documents\FDX\4_2023-12-28' --> 'data\processed_data\FDX\4_2023-12-28.md'


2025-11-14 16:39:06,755 - INFO - Going to convert document batch...
2025-11-14 16:39:06,756 - INFO - Processing document 4_2024-01-08
2025-11-14 16:39:06,850 - INFO - Finished converting document 4_2024-01-08 in 0.14 sec.
2025-11-14 16:39:06,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:07,094 - INFO - Going to convert document batch...
2025-11-14 16:39:07,096 - INFO - Processing document 4_2024-03-27


Converted 'data\edgar_documents\FDX\4_2024-01-08' --> 'data\processed_data\FDX\4_2024-01-08.md'


2025-11-14 16:39:07,834 - INFO - Finished converting document 4_2024-03-27 in 0.91 sec.
2025-11-14 16:39:07,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:07,973 - INFO - Going to convert document batch...
2025-11-14 16:39:07,974 - INFO - Processing document 4_2024-03-28
2025-11-14 16:39:08,028 - INFO - Finished converting document 4_2024-03-28 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2024-03-27' --> 'data\processed_data\FDX\4_2024-03-27.md'
Converted 'data\edgar_documents\FDX\4_2024-03-28' --> 'data\processed_data\FDX\4_2024-03-28.md'


2025-11-14 16:39:08,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:08,151 - INFO - Going to convert document batch...
2025-11-14 16:39:08,152 - INFO - Processing document 4_2024-04-04
2025-11-14 16:39:08,222 - INFO - Finished converting document 4_2024-04-04 in 0.14 sec.
2025-11-14 16:39:08,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:08,411 - INFO - Going to convert document batch...
2025-11-14 16:39:08,412 - INFO - Processing document 4_2024-04-05
2025-11-14 16:39:08,496 - INFO - Finished converting document 4_2024-04-05 in 0.19 sec.


Converted 'data\edgar_documents\FDX\4_2024-04-04' --> 'data\processed_data\FDX\4_2024-04-04.md'


2025-11-14 16:39:08,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:08,633 - INFO - Going to convert document batch...
2025-11-14 16:39:08,635 - INFO - Processing document 4_2024-04-08
2025-11-14 16:39:08,721 - INFO - Finished converting document 4_2024-04-08 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2024-04-05' --> 'data\processed_data\FDX\4_2024-04-05.md'


2025-11-14 16:39:08,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:08,881 - INFO - Going to convert document batch...
2025-11-14 16:39:08,882 - INFO - Processing document 4_2024-04-09
2025-11-14 16:39:08,961 - INFO - Finished converting document 4_2024-04-09 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2024-04-08' --> 'data\processed_data\FDX\4_2024-04-08.md'


2025-11-14 16:39:09,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:09,118 - INFO - Going to convert document batch...
2025-11-14 16:39:09,119 - INFO - Processing document 4_2024-06-28
2025-11-14 16:39:09,189 - INFO - Finished converting document 4_2024-06-28 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2024-04-09' --> 'data\processed_data\FDX\4_2024-04-09.md'


2025-11-14 16:39:09,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:09,340 - INFO - Going to convert document batch...
2025-11-14 16:39:09,341 - INFO - Processing document 4_2024-07-01
2025-11-14 16:39:09,421 - INFO - Finished converting document 4_2024-07-01 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2024-06-28' --> 'data\processed_data\FDX\4_2024-06-28.md'
Converted 'data\edgar_documents\FDX\4_2024-07-01' --> 'data\processed_data\FDX\4_2024-07-01.md'


2025-11-14 16:39:09,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:09,594 - INFO - Going to convert document batch...
2025-11-14 16:39:09,596 - INFO - Processing document 4_2024-07-02
2025-11-14 16:39:09,667 - INFO - Finished converting document 4_2024-07-02 in 0.17 sec.
2025-11-14 16:39:09,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:09,801 - INFO - Going to convert document batch...
2025-11-14 16:39:09,802 - INFO - Processing document 4_2024-07-05
2025-11-14 16:39:09,862 - INFO - Finished converting document 4_2024-07-05 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2024-07-02' --> 'data\processed_data\FDX\4_2024-07-02.md'
Converted 'data\edgar_documents\FDX\4_2024-07-05' --> 'data\processed_data\FDX\4_2024-07-05.md'


2025-11-14 16:39:10,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:10,142 - INFO - Going to convert document batch...
2025-11-14 16:39:10,143 - INFO - Processing document 4_2024-07-11
2025-11-14 16:39:10,209 - INFO - Finished converting document 4_2024-07-11 in 0.28 sec.
2025-11-14 16:39:10,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:10,342 - INFO - Going to convert document batch...
2025-11-14 16:39:10,343 - INFO - Processing document 4_2024-07-18
2025-11-14 16:39:10,398 - INFO - Finished converting document 4_2024-07-18 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2024-07-11' --> 'data\processed_data\FDX\4_2024-07-11.md'
Converted 'data\edgar_documents\FDX\4_2024-07-18' --> 'data\processed_data\FDX\4_2024-07-18.md'


2025-11-14 16:39:10,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:10,527 - INFO - Going to convert document batch...
2025-11-14 16:39:10,529 - INFO - Processing document 4_2024-09-24
2025-11-14 16:39:10,577 - INFO - Finished converting document 4_2024-09-24 in 0.12 sec.
2025-11-14 16:39:10,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:10,716 - INFO - Going to convert document batch...
2025-11-14 16:39:10,718 - INFO - Processing document 4_2024-12-23
2025-11-14 16:39:10,769 - INFO - Finished converting document 4_2024-12-23 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2024-09-24' --> 'data\processed_data\FDX\4_2024-09-24.md'


2025-11-14 16:39:10,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:10,865 - INFO - Going to convert document batch...
2025-11-14 16:39:10,866 - INFO - Processing document 4_2024-12-26
2025-11-14 16:39:10,935 - INFO - Finished converting document 4_2024-12-26 in 0.11 sec.


Converted 'data\edgar_documents\FDX\4_2024-12-23' --> 'data\processed_data\FDX\4_2024-12-23.md'
Converted 'data\edgar_documents\FDX\4_2024-12-26' --> 'data\processed_data\FDX\4_2024-12-26.md'


2025-11-14 16:39:11,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:11,101 - INFO - Going to convert document batch...
2025-11-14 16:39:11,102 - INFO - Processing document 4_2025-01-06
2025-11-14 16:39:11,172 - INFO - Finished converting document 4_2025-01-06 in 0.17 sec.
2025-11-14 16:39:11,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:11,303 - INFO - Going to convert document batch...
2025-11-14 16:39:11,305 - INFO - Processing document 4_2025-01-08
2025-11-14 16:39:11,367 - INFO - Finished converting document 4_2025-01-08 in 0.12 sec.


Converted 'data\edgar_documents\FDX\4_2025-01-06' --> 'data\processed_data\FDX\4_2025-01-06.md'


2025-11-14 16:39:11,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:11,541 - INFO - Going to convert document batch...
2025-11-14 16:39:11,542 - INFO - Processing document 4_2025-01-10
2025-11-14 16:39:11,642 - INFO - Finished converting document 4_2025-01-10 in 0.20 sec.


Converted 'data\edgar_documents\FDX\4_2025-01-08' --> 'data\processed_data\FDX\4_2025-01-08.md'


2025-11-14 16:39:11,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:11,778 - INFO - Going to convert document batch...
2025-11-14 16:39:11,780 - INFO - Processing document 4_2025-01-14
2025-11-14 16:39:11,856 - INFO - Finished converting document 4_2025-01-14 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2025-01-10' --> 'data\processed_data\FDX\4_2025-01-10.md'


2025-11-14 16:39:11,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:12,019 - INFO - Going to convert document batch...
2025-11-14 16:39:12,023 - INFO - Processing document 4_2025-03-24
2025-11-14 16:39:12,095 - INFO - Finished converting document 4_2025-03-24 in 0.16 sec.


Converted 'data\edgar_documents\FDX\4_2025-01-14' --> 'data\processed_data\FDX\4_2025-01-14.md'


2025-11-14 16:39:12,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:12,233 - INFO - Going to convert document batch...
2025-11-14 16:39:12,235 - INFO - Processing document 4_2025-03-27
2025-11-14 16:39:12,313 - INFO - Finished converting document 4_2025-03-27 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2025-03-24' --> 'data\processed_data\FDX\4_2025-03-24.md'


2025-11-14 16:39:12,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:12,503 - INFO - Going to convert document batch...
2025-11-14 16:39:12,506 - INFO - Processing document 4_2025-04-11
2025-11-14 16:39:12,601 - INFO - Finished converting document 4_2025-04-11 in 0.19 sec.


Converted 'data\edgar_documents\FDX\4_2025-03-27' --> 'data\processed_data\FDX\4_2025-03-27.md'


2025-11-14 16:39:12,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:12,733 - INFO - Going to convert document batch...
2025-11-14 16:39:12,735 - INFO - Processing document 4_2025-06-27
2025-11-14 16:39:12,802 - INFO - Finished converting document 4_2025-06-27 in 0.11 sec.


Converted 'data\edgar_documents\FDX\4_2025-04-11' --> 'data\processed_data\FDX\4_2025-04-11.md'
Converted 'data\edgar_documents\FDX\4_2025-06-27' --> 'data\processed_data\FDX\4_2025-06-27.md'


2025-11-14 16:39:12,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:12,953 - INFO - Going to convert document batch...
2025-11-14 16:39:12,955 - INFO - Processing document 4_2025-07-07
2025-11-14 16:39:13,038 - INFO - Finished converting document 4_2025-07-07 in 0.17 sec.
2025-11-14 16:39:13,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:13,216 - INFO - Going to convert document batch...
2025-11-14 16:39:13,218 - INFO - Processing document 4_2025-07-08
2025-11-14 16:39:13,296 - INFO - Finished converting document 4_2025-07-08 in 0.17 sec.


Converted 'data\edgar_documents\FDX\4_2025-07-07' --> 'data\processed_data\FDX\4_2025-07-07.md'


2025-11-14 16:39:13,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:13,437 - INFO - Going to convert document batch...
2025-11-14 16:39:13,438 - INFO - Processing document 4_2025-07-09
2025-11-14 16:39:13,506 - INFO - Finished converting document 4_2025-07-09 in 0.11 sec.


Converted 'data\edgar_documents\FDX\4_2025-07-08' --> 'data\processed_data\FDX\4_2025-07-08.md'


2025-11-14 16:39:13,633 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:39:13,634 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:39:13,637 - INFO - Going to convert document batch...
2025-11-14 16:39:13,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:13,680 - INFO - Going to convert document batch...
2025-11-14 16:39:13,682 - INFO - Processing document 4_2025-07-23
2025-11-14 16:39:13,744 - INFO - Fin

Converted 'data\edgar_documents\FDX\4_2025-07-09' --> 'data\processed_data\FDX\4_2025-07-09.md'
Error processing data\edgar_documents\FDX\4_2025-07-22: File format not allowed: data\edgar_documents\FDX\4_2025-07-22


2025-11-14 16:39:13,867 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:39:13,868 - ERROR - Input document 4_2025-07-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:39:13,873 - INFO - Going to convert document batch...
2025-11-14 16:39:13,903 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:39:13,905 - ERROR - Input document 4_2025-08-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\FDX\4_2025-07-23' --> 'data\processed_data\FDX\4_2025-07-23.md'
Error processing data\edgar_documents\FDX\4_2025-07-25: File format not allowed: data\edgar_documents\FDX\4_2025-07-25
Error processing data\edgar_documents\FDX\4_2025-08-29: File format not allowed: data\edgar_documents\FDX\4_2025-08-29


2025-11-14 16:39:14,025 - INFO - Finished converting document 4_2025-09-24 in 0.11 sec.
2025-11-14 16:39:14,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:14,183 - INFO - Going to convert document batch...
2025-11-14 16:39:14,185 - INFO - Processing document 4_2025-10-01
2025-11-14 16:39:14,253 - INFO - Finished converting document 4_2025-10-01 in 0.14 sec.


Converted 'data\edgar_documents\FDX\4_2025-09-24' --> 'data\processed_data\FDX\4_2025-09-24.md'


2025-11-14 16:39:14,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:14,387 - INFO - Going to convert document batch...
2025-11-14 16:39:14,388 - INFO - Processing document 4_2025-10-03
2025-11-14 16:39:14,494 - INFO - Finished converting document 4_2025-10-03 in 0.19 sec.


Converted 'data\edgar_documents\FDX\4_2025-10-01' --> 'data\processed_data\FDX\4_2025-10-01.md'


2025-11-14 16:39:14,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:14,662 - INFO - Going to convert document batch...
2025-11-14 16:39:14,664 - INFO - Processing document 8-K_2023-03-06
2025-11-14 16:39:14,751 - INFO - Finished converting document 8-K_2023-03-06 in 0.19 sec.


Converted 'data\edgar_documents\FDX\4_2025-10-03' --> 'data\processed_data\FDX\4_2025-10-03.md'


2025-11-14 16:39:14,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:14,931 - INFO - Going to convert document batch...
2025-11-14 16:39:14,932 - INFO - Processing document 8-K_2023-03-16


Converted 'data\edgar_documents\FDX\8-K_2023-03-06' --> 'data\processed_data\FDX\8-K_2023-03-06.md'


2025-11-14 16:39:15,007 - INFO - Finished converting document 8-K_2023-03-16 in 0.20 sec.
2025-11-14 16:39:15,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:15,136 - INFO - Going to convert document batch...
2025-11-14 16:39:15,138 - INFO - Processing document 8-K_2023-06-20
2025-11-14 16:39:15,204 - INFO - Finished converting document 8-K_2023-06-20 in 0.17 sec.


Converted 'data\edgar_documents\FDX\8-K_2023-03-16' --> 'data\processed_data\FDX\8-K_2023-03-16.md'


2025-11-14 16:39:15,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:15,351 - INFO - Going to convert document batch...
2025-11-14 16:39:15,353 - INFO - Processing document 8-K_2023-07-17


Converted 'data\edgar_documents\FDX\8-K_2023-06-20' --> 'data\processed_data\FDX\8-K_2023-06-20.md'


2025-11-14 16:39:15,484 - INFO - Finished converting document 8-K_2023-07-17 in 0.25 sec.
2025-11-14 16:39:15,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:15,588 - INFO - Going to convert document batch...
2025-11-14 16:39:15,590 - INFO - Processing document 8-K_2023-07-31
2025-11-14 16:39:15,650 - INFO - Finished converting document 8-K_2023-07-31 in 0.11 sec.
2025-11-14 16:39:15,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\8-K_2023-07-17' --> 'data\processed_data\FDX\8-K_2023-07-17.md'
Converted 'data\edgar_documents\FDX\8-K_2023-07-31' --> 'data\processed_data\FDX\8-K_2023-07-31.md'


2025-11-14 16:39:15,801 - INFO - Going to convert document batch...
2025-11-14 16:39:15,803 - INFO - Processing document 8-K_2023-09-20
2025-11-14 16:39:15,889 - INFO - Finished converting document 8-K_2023-09-20 in 0.20 sec.
2025-11-14 16:39:15,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:16,054 - INFO - Going to convert document batch...
2025-11-14 16:39:16,056 - INFO - Processing document 8-K_2023-09-22


Converted 'data\edgar_documents\FDX\8-K_2023-09-20' --> 'data\processed_data\FDX\8-K_2023-09-20.md'


2025-11-14 16:39:16,264 - INFO - Finished converting document 8-K_2023-09-22 in 0.34 sec.
2025-11-14 16:39:16,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:16,445 - INFO - Going to convert document batch...
2025-11-14 16:39:16,446 - INFO - Processing document 8-K_2023-10-05
2025-11-14 16:39:16,497 - INFO - Finished converting document 8-K_2023-10-05 in 0.14 sec.


Converted 'data\edgar_documents\FDX\8-K_2023-09-22' --> 'data\processed_data\FDX\8-K_2023-09-22.md'
Converted 'data\edgar_documents\FDX\8-K_2023-10-05' --> 'data\processed_data\FDX\8-K_2023-10-05.md'


2025-11-14 16:39:16,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:16,616 - INFO - Going to convert document batch...
2025-11-14 16:39:16,618 - INFO - Processing document 8-K_2023-10-18
2025-11-14 16:39:16,674 - INFO - Finished converting document 8-K_2023-10-18 in 0.16 sec.
2025-11-14 16:39:16,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:16,763 - INFO - Going to convert document batch...
2025-11-14 16:39:16,765 - INFO - Processing document 8-K_2023-12-11
2025-11-14 16:39:16,820 - INFO - Finished converting document 8-K_2023-12-11 in 0.11 sec.
2025-11-14 16:39:16,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\8-K_2023-10-18' --> 'data\processed_data\FDX\8-K_2023-10-18.md'
Converted 'data\edgar_documents\FDX\8-K_2023-12-11' --> 'data\processed_data\FDX\8-K_2023-12-11.md'


2025-11-14 16:39:16,958 - INFO - Going to convert document batch...
2025-11-14 16:39:16,959 - INFO - Processing document 8-K_2023-12-19
2025-11-14 16:39:17,036 - INFO - Finished converting document 8-K_2023-12-19 in 0.19 sec.
2025-11-14 16:39:17,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:17,152 - INFO - Going to convert document batch...
2025-11-14 16:39:17,154 - INFO - Processing document 8-K_2023-12-22
2025-11-14 16:39:17,213 - INFO - Finished converting document 8-K_2023-12-22 in 0.16 sec.


Converted 'data\edgar_documents\FDX\8-K_2023-12-19' --> 'data\processed_data\FDX\8-K_2023-12-19.md'
Converted 'data\edgar_documents\FDX\8-K_2023-12-22' --> 'data\processed_data\FDX\8-K_2023-12-22.md'


2025-11-14 16:39:17,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:17,361 - INFO - Going to convert document batch...
2025-11-14 16:39:17,362 - INFO - Processing document 8-K_2024-03-11
2025-11-14 16:39:17,420 - INFO - Finished converting document 8-K_2024-03-11 in 0.17 sec.
2025-11-14 16:39:17,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:17,561 - INFO - Going to convert document batch...
2025-11-14 16:39:17,563 - INFO - Processing document 8-K_2024-03-21
2025-11-14 16:39:17,628 - INFO - Finished converting document 8-K_2024-03-21 in 0.14 sec.


Converted 'data\edgar_documents\FDX\8-K_2024-03-11' --> 'data\processed_data\FDX\8-K_2024-03-11.md'
Converted 'data\edgar_documents\FDX\8-K_2024-03-21' --> 'data\processed_data\FDX\8-K_2024-03-21.md'


2025-11-14 16:39:17,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:17,752 - INFO - Going to convert document batch...
2025-11-14 16:39:17,755 - INFO - Processing document 8-K_2024-04-01
2025-11-14 16:39:17,815 - INFO - Finished converting document 8-K_2024-04-01 in 0.16 sec.
2025-11-14 16:39:17,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:17,934 - INFO - Going to convert document batch...
2025-11-14 16:39:17,936 - INFO - Processing document 8-K_2024-04-26
2025-11-14 16:39:17,985 - INFO - Finished converting document 8-K_2024-04-26 in 0.14 sec.
2025-11-14 16:39:18,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\8-K_2024-04-01' --> 'data\processed_data\FDX\8-K_2024-04-01.md'
Converted 'data\edgar_documents\FDX\8-K_2024-04-26' --> 'data\processed_data\FDX\8-K_2024-04-26.md'


2025-11-14 16:39:18,493 - INFO - Going to convert document batch...
2025-11-14 16:39:18,494 - INFO - Processing document 8-K_2024-06-12
2025-11-14 16:39:18,564 - INFO - Finished converting document 8-K_2024-06-12 in 0.56 sec.
2025-11-14 16:39:18,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:18,692 - INFO - Going to convert document batch...
2025-11-14 16:39:18,693 - INFO - Processing document 8-K_2024-06-25
2025-11-14 16:39:18,777 - INFO - Finished converting document 8-K_2024-06-25 in 0.19 sec.


Converted 'data\edgar_documents\FDX\8-K_2024-06-12' --> 'data\processed_data\FDX\8-K_2024-06-12.md'


2025-11-14 16:39:18,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:18,924 - INFO - Going to convert document batch...
2025-11-14 16:39:18,925 - INFO - Processing document 8-K_2024-09-03


Converted 'data\edgar_documents\FDX\8-K_2024-06-25' --> 'data\processed_data\FDX\8-K_2024-06-25.md'


2025-11-14 16:39:19,007 - INFO - Finished converting document 8-K_2024-09-03 in 0.20 sec.
2025-11-14 16:39:19,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:19,169 - INFO - Going to convert document batch...
2025-11-14 16:39:19,171 - INFO - Processing document 8-K_2024-09-19


Converted 'data\edgar_documents\FDX\8-K_2024-09-03' --> 'data\processed_data\FDX\8-K_2024-09-03.md'


2025-11-14 16:39:19,249 - INFO - Finished converting document 8-K_2024-09-19 in 0.22 sec.
2025-11-14 16:39:19,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:19,427 - INFO - Going to convert document batch...
2025-11-14 16:39:19,430 - INFO - Processing document 8-K_2024-09-24


Converted 'data\edgar_documents\FDX\8-K_2024-09-19' --> 'data\processed_data\FDX\8-K_2024-09-19.md'


2025-11-14 16:39:19,630 - INFO - Finished converting document 8-K_2024-09-24 in 0.34 sec.
2025-11-14 16:39:19,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:19,796 - INFO - Going to convert document batch...
2025-11-14 16:39:19,797 - INFO - Processing document 8-K_2024-12-19
2025-11-14 16:39:19,874 - INFO - Finished converting document 8-K_2024-12-19 in 0.16 sec.


Converted 'data\edgar_documents\FDX\8-K_2024-09-24' --> 'data\processed_data\FDX\8-K_2024-09-24.md'


2025-11-14 16:39:19,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:20,028 - INFO - Going to convert document batch...
2025-11-14 16:39:20,031 - INFO - Processing document 8-K_2025-01-07
2025-11-14 16:39:20,095 - INFO - Finished converting document 8-K_2025-01-07 in 0.19 sec.


Converted 'data\edgar_documents\FDX\8-K_2024-12-19' --> 'data\processed_data\FDX\8-K_2024-12-19.md'


2025-11-14 16:39:20,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:20,236 - INFO - Going to convert document batch...
2025-11-14 16:39:20,237 - INFO - Processing document 8-K_2025-01-23
2025-11-14 16:39:20,314 - INFO - Finished converting document 8-K_2025-01-23 in 0.17 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-01-07' --> 'data\processed_data\FDX\8-K_2025-01-07.md'


2025-11-14 16:39:20,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:20,425 - INFO - Going to convert document batch...
2025-11-14 16:39:20,427 - INFO - Processing document 8-K_2025-01-30
2025-11-14 16:39:20,518 - INFO - Finished converting document 8-K_2025-01-30 in 0.16 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-01-23' --> 'data\processed_data\FDX\8-K_2025-01-23.md'
Converted 'data\edgar_documents\FDX\8-K_2025-01-30' --> 'data\processed_data\FDX\8-K_2025-01-30.md'


2025-11-14 16:39:20,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:20,665 - INFO - Going to convert document batch...
2025-11-14 16:39:20,667 - INFO - Processing document 8-K_2025-02-07
2025-11-14 16:39:20,738 - INFO - Finished converting document 8-K_2025-02-07 in 0.17 sec.
2025-11-14 16:39:20,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:20,956 - INFO - Going to convert document batch...
2025-11-14 16:39:20,958 - INFO - Processing document 8-K_2025-02-26


Converted 'data\edgar_documents\FDX\8-K_2025-02-07' --> 'data\processed_data\FDX\8-K_2025-02-07.md'


2025-11-14 16:39:21,240 - INFO - Finished converting document 8-K_2025-02-26 in 0.45 sec.
2025-11-14 16:39:21,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:21,464 - INFO - Going to convert document batch...
2025-11-14 16:39:21,466 - INFO - Processing document 8-K_2025-03-20
2025-11-14 16:39:21,527 - INFO - Finished converting document 8-K_2025-03-20 in 0.16 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-02-26' --> 'data\processed_data\FDX\8-K_2025-02-26.md'
Converted 'data\edgar_documents\FDX\8-K_2025-03-20' --> 'data\processed_data\FDX\8-K_2025-03-20.md'


2025-11-14 16:39:21,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:21,654 - INFO - Going to convert document batch...
2025-11-14 16:39:21,656 - INFO - Processing document 8-K_2025-05-12
2025-11-14 16:39:21,707 - INFO - Finished converting document 8-K_2025-05-12 in 0.16 sec.
2025-11-14 16:39:21,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:21,812 - INFO - Going to convert document batch...
2025-11-14 16:39:21,814 - INFO - Processing document 8-K_2025-06-23
2025-11-14 16:39:21,864 - INFO - Finished converting document 8-K_2025-06-23 in 0.12 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-05-12' --> 'data\processed_data\FDX\8-K_2025-05-12.md'
Converted 'data\edgar_documents\FDX\8-K_2025-06-23' --> 'data\processed_data\FDX\8-K_2025-06-23.md'


2025-11-14 16:39:21,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:21,988 - INFO - Going to convert document batch...
2025-11-14 16:39:21,990 - INFO - Processing document 8-K_2025-06-24
2025-11-14 16:39:22,074 - INFO - Finished converting document 8-K_2025-06-24 in 0.19 sec.
2025-11-14 16:39:22,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:22,166 - INFO - Going to convert document batch...
2025-11-14 16:39:22,168 - INFO - Processing document 8-K_2025-07-17
2025-11-14 16:39:22,224 - INFO - Finished converting document 8-K_2025-07-17 in 0.11 sec.
2025-11-14 16:39:22,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\8-K_2025-06-24' --> 'data\processed_data\FDX\8-K_2025-06-24.md'
Converted 'data\edgar_documents\FDX\8-K_2025-07-17' --> 'data\processed_data\FDX\8-K_2025-07-17.md'


2025-11-14 16:39:22,331 - INFO - Going to convert document batch...
2025-11-14 16:39:22,332 - INFO - Processing document 8-K_2025-07-24
2025-11-14 16:39:22,402 - INFO - Finished converting document 8-K_2025-07-24 in 0.16 sec.
2025-11-14 16:39:22,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:22,538 - INFO - Going to convert document batch...
2025-11-14 16:39:22,539 - INFO - Processing document 8-K_2025-07-30
2025-11-14 16:39:22,648 - INFO - Finished converting document 8-K_2025-07-30 in 0.20 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-07-24' --> 'data\processed_data\FDX\8-K_2025-07-24.md'


2025-11-14 16:39:22,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:22,810 - INFO - Going to convert document batch...
2025-11-14 16:39:22,812 - INFO - Processing document 8-K_2025-08-12
2025-11-14 16:39:22,876 - INFO - Finished converting document 8-K_2025-08-12 in 0.17 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-07-30' --> 'data\processed_data\FDX\8-K_2025-07-30.md'


2025-11-14 16:39:22,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:22,993 - INFO - Going to convert document batch...
2025-11-14 16:39:22,994 - INFO - Processing document 8-K_2025-09-18
2025-11-14 16:39:23,075 - INFO - Finished converting document 8-K_2025-09-18 in 0.17 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-08-12' --> 'data\processed_data\FDX\8-K_2025-08-12.md'
Converted 'data\edgar_documents\FDX\8-K_2025-09-18' --> 'data\processed_data\FDX\8-K_2025-09-18.md'


2025-11-14 16:39:23,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:23,283 - INFO - Going to convert document batch...
2025-11-14 16:39:23,284 - INFO - Processing document 8-K_2025-10-02
2025-11-14 16:39:23,518 - INFO - Finished converting document 8-K_2025-10-02 in 0.39 sec.
2025-11-14 16:39:23,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:39:23,740 - INFO - Going to convert document batch...
2025-11-14 16:39:23,742 - INFO - Processing document 8-K_2025-11-06
2025-11-14 16:39:23,801 - INFO - Finished converting document 8-K_2025-11-06 in 0.17 sec.


Converted 'data\edgar_documents\FDX\8-K_2025-10-02' --> 'data\processed_data\FDX\8-K_2025-10-02.md'


2025-11-14 16:39:23,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\8-K_2025-11-06' --> 'data\processed_data\FDX\8-K_2025-11-06.md'


2025-11-14 16:39:26,278 - INFO - Going to convert document batch...
2025-11-14 16:39:26,279 - INFO - Processing document DEF-14A_2023-08-10
2025-11-14 16:40:00,462 - INFO - Finished converting document DEF-14A_2023-08-10 in 36.61 sec.
2025-11-14 16:40:03,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\FDX\DEF-14A_2023-08-10' --> 'data\processed_data\FDX\DEF-14A_2023-08-10.md'


2025-11-14 16:40:05,991 - INFO - Going to convert document batch...
2025-11-14 16:40:05,994 - INFO - Processing document DEF-14A_2024-08-12
2025-11-14 16:40:47,166 - INFO - Finished converting document DEF-14A_2024-08-12 in 43.38 sec.
2025-11-14 16:40:51,293 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:40:51,294 - ERROR - Input document DEF-14A_2025-08-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:40:51,300 - INFO - Going to

Converted 'data\edgar_documents\FDX\DEF-14A_2024-08-12' --> 'data\processed_data\FDX\DEF-14A_2024-08-12.md'
Error processing data\edgar_documents\FDX\DEF-14A_2025-08-18: File format not allowed: data\edgar_documents\FDX\DEF-14A_2025-08-18
Processed 99 new files. Errors: 4
Found 106 files to process in data\edgar_documents\GD


2025-11-14 16:40:51,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:40:53,456 - INFO - Going to convert document batch...
2025-11-14 16:40:53,456 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:40:53,458 - INFO - Processing document 10-K_2023-02-07
2025-11-14 16:40:59,980 - INFO - Finished converting document 10-K_2023-02-07 in 8.64 sec.
2025-11-14 16:41:01,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-K_2023-02-07' --> 'data\processed_data\GD\10-K_2023-02-07.md'


2025-11-14 16:41:03,631 - INFO - Going to convert document batch...
2025-11-14 16:41:03,632 - INFO - Processing document 10-K_2024-02-08
2025-11-14 16:41:08,961 - INFO - Finished converting document 10-K_2024-02-08 in 7.31 sec.
2025-11-14 16:41:10,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-K_2024-02-08' --> 'data\processed_data\GD\10-K_2024-02-08.md'


2025-11-14 16:41:12,177 - INFO - Going to convert document batch...
2025-11-14 16:41:12,179 - INFO - Processing document 10-K_2025-02-07
2025-11-14 16:41:16,865 - INFO - Finished converting document 10-K_2025-02-07 in 6.66 sec.
2025-11-14 16:41:18,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-K_2025-02-07' --> 'data\processed_data\GD\10-K_2025-02-07.md'


2025-11-14 16:41:19,739 - INFO - Going to convert document batch...
2025-11-14 16:41:19,740 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 16:41:22,291 - INFO - Finished converting document 10-Q_2023-04-26 in 3.92 sec.
2025-11-14 16:41:23,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2023-04-26' --> 'data\processed_data\GD\10-Q_2023-04-26.md'


2025-11-14 16:41:24,242 - INFO - Going to convert document batch...
2025-11-14 16:41:24,243 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 16:41:25,729 - INFO - Finished converting document 10-Q_2023-07-26 in 2.72 sec.
2025-11-14 16:41:26,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2023-07-26' --> 'data\processed_data\GD\10-Q_2023-07-26.md'


2025-11-14 16:41:26,606 - INFO - Going to convert document batch...
2025-11-14 16:41:26,607 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 16:41:28,039 - INFO - Finished converting document 10-Q_2023-10-25 in 1.98 sec.
2025-11-14 16:41:28,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2023-10-25' --> 'data\processed_data\GD\10-Q_2023-10-25.md'


2025-11-14 16:41:28,819 - INFO - Going to convert document batch...
2025-11-14 16:41:28,820 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 16:41:29,676 - INFO - Finished converting document 10-Q_2024-04-24 in 1.23 sec.
2025-11-14 16:41:30,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2024-04-24' --> 'data\processed_data\GD\10-Q_2024-04-24.md'


2025-11-14 16:41:30,770 - INFO - Going to convert document batch...
2025-11-14 16:41:30,772 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 16:41:31,806 - INFO - Finished converting document 10-Q_2024-07-24 in 1.73 sec.
2025-11-14 16:41:33,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2024-07-24' --> 'data\processed_data\GD\10-Q_2024-07-24.md'


2025-11-14 16:41:33,639 - INFO - Going to convert document batch...
2025-11-14 16:41:33,639 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 16:41:34,595 - INFO - Finished converting document 10-Q_2024-10-23 in 1.67 sec.
2025-11-14 16:41:35,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2024-10-23' --> 'data\processed_data\GD\10-Q_2024-10-23.md'


2025-11-14 16:41:35,480 - INFO - Going to convert document batch...
2025-11-14 16:41:35,481 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 16:41:37,005 - INFO - Finished converting document 10-Q_2025-04-23 in 2.00 sec.
2025-11-14 16:41:37,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2025-04-23' --> 'data\processed_data\GD\10-Q_2025-04-23.md'


2025-11-14 16:41:38,113 - INFO - Going to convert document batch...
2025-11-14 16:41:38,114 - INFO - Processing document 10-Q_2025-07-23
2025-11-14 16:41:39,178 - INFO - Finished converting document 10-Q_2025-07-23 in 1.81 sec.
2025-11-14 16:41:39,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\10-Q_2025-07-23' --> 'data\processed_data\GD\10-Q_2025-07-23.md'


2025-11-14 16:41:40,782 - INFO - Going to convert document batch...
2025-11-14 16:41:40,783 - INFO - Processing document 10-Q_2025-10-24
2025-11-14 16:41:42,125 - INFO - Finished converting document 10-Q_2025-10-24 in 2.42 sec.
2025-11-14 16:41:42,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:42,712 - INFO - Going to convert document batch...
2025-11-14 16:41:42,713 - INFO - Processing document 4_2023-01-31
2025-11-14 16:41:42,748 - INFO - Finished converting document 4_2023-01-31 in 0.22 sec.


Converted 'data\edgar_documents\GD\10-Q_2025-10-24' --> 'data\processed_data\GD\10-Q_2025-10-24.md'


2025-11-14 16:41:42,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:42,813 - INFO - Going to convert document batch...
2025-11-14 16:41:42,814 - INFO - Processing document 4_2023-02-14
2025-11-14 16:41:42,845 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.
2025-11-14 16:41:42,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:42,916 - INFO - Going to convert document batch...
2025-11-14 16:41:42,916 - INFO - Processing document 4_2023-03-08
2025-11-14 16:41:42,939 - INFO - Finished converting document 4_2023-03-08 in 0.06 sec.
2025-11-14 16:41:42,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2023-01-31' --> 'data\processed_data\GD\4_2023-01-31.md'
Converted 'data\edgar_documents\GD\4_2023-02-14' --> 'data\processed_data\GD\4_2023-02-14.md'
Converted 'data\edgar_documents\GD\4_2023-03-08' --> 'data\processed_data\GD\4_2023-03-08.md'


2025-11-14 16:41:42,987 - INFO - Going to convert document batch...
2025-11-14 16:41:42,988 - INFO - Processing document 4_2023-03-09
2025-11-14 16:41:43,079 - INFO - Finished converting document 4_2023-03-09 in 0.12 sec.
2025-11-14 16:41:43,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,144 - INFO - Going to convert document batch...
2025-11-14 16:41:43,144 - INFO - Processing document 4_2023-03-10
2025-11-14 16:41:43,171 - INFO - Finished converting document 4_2023-03-10 in 0.06 sec.
2025-11-14 16:41:43,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,229 - INFO - Going to convert document batch...
2025-11-14 16:41:43,230 - INFO - Processing document 4_2023-03-20
2025-11-14 16:41:43,253 - INFO - Finished converting document 4_2023-03-20 in 0.05 sec.
2025-11-14 16:41:43,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2023-03-09' --> 'data\processed_data\GD\4_2023-03-09.md'
Converted 'data\edgar_documents\GD\4_2023-03-10' --> 'data\processed_data\GD\4_2023-03-10.md'
Converted 'data\edgar_documents\GD\4_2023-03-20' --> 'data\processed_data\GD\4_2023-03-20.md'


2025-11-14 16:41:43,323 - INFO - Going to convert document batch...
2025-11-14 16:41:43,324 - INFO - Processing document 4_2023-05-04
2025-11-14 16:41:43,360 - INFO - Finished converting document 4_2023-05-04 in 0.08 sec.
2025-11-14 16:41:43,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,409 - INFO - Going to convert document batch...
2025-11-14 16:41:43,411 - INFO - Processing document 4_2023-05-16
2025-11-14 16:41:43,434 - INFO - Finished converting document 4_2023-05-16 in 0.05 sec.
2025-11-14 16:41:43,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,499 - INFO - Going to convert document batch...
2025-11-14 16:41:43,500 - INFO - Processing document 4_2023-06-20
2025-11-14 16:41:43,525 - INFO - Finished converting document 4_2023-06-20 in 0.05 sec.
2025-11-14 16:41:43,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,577 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GD\4_2023-05-04' --> 'data\processed_data\GD\4_2023-05-04.md'
Converted 'data\edgar_documents\GD\4_2023-05-16' --> 'data\processed_data\GD\4_2023-05-16.md'
Converted 'data\edgar_documents\GD\4_2023-06-20' --> 'data\processed_data\GD\4_2023-06-20.md'


2025-11-14 16:41:43,578 - INFO - Processing document 4_2023-08-07
2025-11-14 16:41:43,599 - INFO - Finished converting document 4_2023-08-07 in 0.05 sec.
2025-11-14 16:41:43,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,652 - INFO - Going to convert document batch...
2025-11-14 16:41:43,653 - INFO - Processing document 4_2023-08-15
2025-11-14 16:41:43,680 - INFO - Finished converting document 4_2023-08-15 in 0.05 sec.
2025-11-14 16:41:43,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,730 - INFO - Going to convert document batch...
2025-11-14 16:41:43,731 - INFO - Processing document 4_2023-08-16
2025-11-14 16:41:43,754 - INFO - Finished converting document 4_2023-08-16 in 0.05 sec.
2025-11-14 16:41:43,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,798 - INFO - Going to convert document batch...
2025-11-14 16:41:43,799 - INFO - Processing document 4_2023-09-20


Converted 'data\edgar_documents\GD\4_2023-08-07' --> 'data\processed_data\GD\4_2023-08-07.md'
Converted 'data\edgar_documents\GD\4_2023-08-15' --> 'data\processed_data\GD\4_2023-08-15.md'
Converted 'data\edgar_documents\GD\4_2023-08-16' --> 'data\processed_data\GD\4_2023-08-16.md'


2025-11-14 16:41:43,827 - INFO - Finished converting document 4_2023-09-20 in 0.05 sec.
2025-11-14 16:41:43,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,882 - INFO - Going to convert document batch...
2025-11-14 16:41:43,883 - INFO - Processing document 4_2023-10-31
2025-11-14 16:41:43,908 - INFO - Finished converting document 4_2023-10-31 in 0.06 sec.
2025-11-14 16:41:43,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:43,954 - INFO - Going to convert document batch...
2025-11-14 16:41:43,956 - INFO - Processing document 4_2023-11-01
2025-11-14 16:41:43,982 - INFO - Finished converting document 4_2023-11-01 in 0.06 sec.
2025-11-14 16:41:44,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,025 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GD\4_2023-09-20' --> 'data\processed_data\GD\4_2023-09-20.md'
Converted 'data\edgar_documents\GD\4_2023-10-31' --> 'data\processed_data\GD\4_2023-10-31.md'
Converted 'data\edgar_documents\GD\4_2023-11-01' --> 'data\processed_data\GD\4_2023-11-01.md'


2025-11-14 16:41:44,026 - INFO - Processing document 4_2023-11-14
2025-11-14 16:41:44,046 - INFO - Finished converting document 4_2023-11-14 in 0.05 sec.
2025-11-14 16:41:44,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,108 - INFO - Going to convert document batch...
2025-11-14 16:41:44,109 - INFO - Processing document 4_2023-12-20
2025-11-14 16:41:44,129 - INFO - Finished converting document 4_2023-12-20 in 0.05 sec.
2025-11-14 16:41:44,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,175 - INFO - Going to convert document batch...
2025-11-14 16:41:44,175 - INFO - Processing document 4_2024-01-30
2025-11-14 16:41:44,202 - INFO - Finished converting document 4_2024-01-30 in 0.06 sec.
2025-11-14 16:41:44,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,267 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GD\4_2023-11-14' --> 'data\processed_data\GD\4_2023-11-14.md'
Converted 'data\edgar_documents\GD\4_2023-12-20' --> 'data\processed_data\GD\4_2023-12-20.md'
Converted 'data\edgar_documents\GD\4_2024-01-30' --> 'data\processed_data\GD\4_2024-01-30.md'


2025-11-14 16:41:44,268 - INFO - Processing document 4_2024-02-01
2025-11-14 16:41:44,299 - INFO - Finished converting document 4_2024-02-01 in 0.06 sec.
2025-11-14 16:41:44,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,454 - INFO - Going to convert document batch...
2025-11-14 16:41:44,454 - INFO - Processing document 4_2024-02-13
2025-11-14 16:41:44,478 - INFO - Finished converting document 4_2024-02-13 in 0.14 sec.
2025-11-14 16:41:44,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2024-02-01' --> 'data\processed_data\GD\4_2024-02-01.md'
Converted 'data\edgar_documents\GD\4_2024-02-13' --> 'data\processed_data\GD\4_2024-02-13.md'


2025-11-14 16:41:44,535 - INFO - Going to convert document batch...
2025-11-14 16:41:44,536 - INFO - Processing document 4_2024-03-05
2025-11-14 16:41:44,565 - INFO - Finished converting document 4_2024-03-05 in 0.06 sec.
2025-11-14 16:41:44,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,615 - INFO - Going to convert document batch...
2025-11-14 16:41:44,616 - INFO - Processing document 4_2024-03-06
2025-11-14 16:41:44,636 - INFO - Finished converting document 4_2024-03-06 in 0.05 sec.
2025-11-14 16:41:44,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,700 - INFO - Going to convert document batch...
2025-11-14 16:41:44,701 - INFO - Processing document 4_2024-03-07
2025-11-14 16:41:44,742 - INFO - Finished converting document 4_2024-03-07 in 0.08 sec.
2025-11-14 16:41:44,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2024-03-05' --> 'data\processed_data\GD\4_2024-03-05.md'
Converted 'data\edgar_documents\GD\4_2024-03-06' --> 'data\processed_data\GD\4_2024-03-06.md'
Converted 'data\edgar_documents\GD\4_2024-03-07' --> 'data\processed_data\GD\4_2024-03-07.md'


2025-11-14 16:41:44,786 - INFO - Going to convert document batch...
2025-11-14 16:41:44,787 - INFO - Processing document 4_2024-03-20
2025-11-14 16:41:44,819 - INFO - Finished converting document 4_2024-03-20 in 0.05 sec.
2025-11-14 16:41:44,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:44,982 - INFO - Going to convert document batch...
2025-11-14 16:41:44,984 - INFO - Processing document 4_2024-04-05
2025-11-14 16:41:45,018 - INFO - Finished converting document 4_2024-04-05 in 0.08 sec.
2025-11-14 16:41:45,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,063 - INFO - Going to convert document batch...
2025-11-14 16:41:45,064 - INFO - Processing document 4_2024-04-30
2025-11-14 16:41:45,083 - INFO - Finished converting document 4_2024-04-30 in 0.03 sec.
2025-11-14 16:41:45,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,131 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GD\4_2024-03-20' --> 'data\processed_data\GD\4_2024-03-20.md'
Converted 'data\edgar_documents\GD\4_2024-04-05' --> 'data\processed_data\GD\4_2024-04-05.md'
Converted 'data\edgar_documents\GD\4_2024-04-30' --> 'data\processed_data\GD\4_2024-04-30.md'


2025-11-14 16:41:45,132 - INFO - Processing document 4_2024-05-03
2025-11-14 16:41:45,177 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.
2025-11-14 16:41:45,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,243 - INFO - Going to convert document batch...
2025-11-14 16:41:45,244 - INFO - Processing document 4_2024-05-07
2025-11-14 16:41:45,269 - INFO - Finished converting document 4_2024-05-07 in 0.06 sec.
2025-11-14 16:41:45,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,316 - INFO - Going to convert document batch...
2025-11-14 16:41:45,317 - INFO - Processing document 4_2024-05-13
2025-11-14 16:41:45,343 - INFO - Finished converting document 4_2024-05-13 in 0.05 sec.
2025-11-14 16:41:45,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,397 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GD\4_2024-05-03' --> 'data\processed_data\GD\4_2024-05-03.md'
Converted 'data\edgar_documents\GD\4_2024-05-07' --> 'data\processed_data\GD\4_2024-05-07.md'
Converted 'data\edgar_documents\GD\4_2024-05-13' --> 'data\processed_data\GD\4_2024-05-13.md'


2025-11-14 16:41:45,398 - INFO - Processing document 4_2024-05-15
2025-11-14 16:41:45,433 - INFO - Finished converting document 4_2024-05-15 in 0.08 sec.
2025-11-14 16:41:45,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,618 - INFO - Going to convert document batch...
2025-11-14 16:41:45,619 - INFO - Processing document 4_2024-05-21
2025-11-14 16:41:45,656 - INFO - Finished converting document 4_2024-05-21 in 0.11 sec.
2025-11-14 16:41:45,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,715 - INFO - Going to convert document batch...
2025-11-14 16:41:45,716 - INFO - Processing document 4_2024-05-22


Converted 'data\edgar_documents\GD\4_2024-05-15' --> 'data\processed_data\GD\4_2024-05-15.md'
Converted 'data\edgar_documents\GD\4_2024-05-21' --> 'data\processed_data\GD\4_2024-05-21.md'


2025-11-14 16:41:45,754 - INFO - Finished converting document 4_2024-05-22 in 0.06 sec.
2025-11-14 16:41:45,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,845 - INFO - Going to convert document batch...
2025-11-14 16:41:45,846 - INFO - Processing document 4_2024-06-21
2025-11-14 16:41:45,870 - INFO - Finished converting document 4_2024-06-21 in 0.06 sec.
2025-11-14 16:41:45,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:45,927 - INFO - Going to convert document batch...
2025-11-14 16:41:45,928 - INFO - Processing document 4_2024-09-18
2025-11-14 16:41:45,950 - INFO - Finished converting document 4_2024-09-18 in 0.06 sec.
2025-11-14 16:41:46,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2024-05-22' --> 'data\processed_data\GD\4_2024-05-22.md'
Converted 'data\edgar_documents\GD\4_2024-06-21' --> 'data\processed_data\GD\4_2024-06-21.md'
Converted 'data\edgar_documents\GD\4_2024-09-18' --> 'data\processed_data\GD\4_2024-09-18.md'


2025-11-14 16:41:46,015 - INFO - Going to convert document batch...
2025-11-14 16:41:46,015 - INFO - Processing document 4_2024-09-19
2025-11-14 16:41:46,041 - INFO - Finished converting document 4_2024-09-19 in 0.08 sec.
2025-11-14 16:41:46,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,110 - INFO - Going to convert document batch...
2025-11-14 16:41:46,113 - INFO - Processing document 4_2024-10-30
2025-11-14 16:41:46,141 - INFO - Finished converting document 4_2024-10-30 in 0.06 sec.
2025-11-14 16:41:46,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,182 - INFO - Going to convert document batch...
2025-11-14 16:41:46,183 - INFO - Processing document 4_2024-10-31
2025-11-14 16:41:46,203 - INFO - Finished converting document 4_2024-10-31 in 0.05 sec.
2025-11-14 16:41:46,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,248 - INFO - Going to convert document batch...
2025-11-14 16:41:46,249 - 

Converted 'data\edgar_documents\GD\4_2024-09-19' --> 'data\processed_data\GD\4_2024-09-19.md'
Converted 'data\edgar_documents\GD\4_2024-10-30' --> 'data\processed_data\GD\4_2024-10-30.md'
Converted 'data\edgar_documents\GD\4_2024-10-31' --> 'data\processed_data\GD\4_2024-10-31.md'


2025-11-14 16:41:46,273 - INFO - Finished converting document 4_2024-11-26 in 0.05 sec.
2025-11-14 16:41:46,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,319 - INFO - Going to convert document batch...
2025-11-14 16:41:46,319 - INFO - Processing document 4_2024-12-19
2025-11-14 16:41:46,418 - INFO - Finished converting document 4_2024-12-19 in 0.12 sec.


Converted 'data\edgar_documents\GD\4_2024-11-26' --> 'data\processed_data\GD\4_2024-11-26.md'
Converted 'data\edgar_documents\GD\4_2024-12-19' --> 'data\processed_data\GD\4_2024-12-19.md'


2025-11-14 16:41:46,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,519 - INFO - Going to convert document batch...
2025-11-14 16:41:46,521 - INFO - Processing document 4_2025-02-04
2025-11-14 16:41:46,562 - INFO - Finished converting document 4_2025-02-04 in 0.11 sec.
2025-11-14 16:41:46,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,662 - INFO - Going to convert document batch...
2025-11-14 16:41:46,663 - INFO - Processing document 4_2025-02-06
2025-11-14 16:41:46,697 - INFO - Finished converting document 4_2025-02-06 in 0.09 sec.
2025-11-14 16:41:46,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,756 - INFO - Going to convert document batch...
2025-11-14 16:41:46,757 - INFO - Processing document 4_2025-03-05
2025-11-14 16:41:46,777 - INFO - Finished converting document 4_2025-03-05 in 0.05 sec.


Converted 'data\edgar_documents\GD\4_2025-02-04' --> 'data\processed_data\GD\4_2025-02-04.md'
Converted 'data\edgar_documents\GD\4_2025-02-06' --> 'data\processed_data\GD\4_2025-02-06.md'


2025-11-14 16:41:46,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,831 - INFO - Going to convert document batch...
2025-11-14 16:41:46,831 - INFO - Processing document 4_2025-03-06
2025-11-14 16:41:46,864 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 16:41:46,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:46,932 - INFO - Going to convert document batch...
2025-11-14 16:41:46,932 - INFO - Processing document 4_2025-03-12
2025-11-14 16:41:46,962 - INFO - Finished converting document 4_2025-03-12 in 0.06 sec.


Converted 'data\edgar_documents\GD\4_2025-03-05' --> 'data\processed_data\GD\4_2025-03-05.md'
Converted 'data\edgar_documents\GD\4_2025-03-06' --> 'data\processed_data\GD\4_2025-03-06.md'
Converted 'data\edgar_documents\GD\4_2025-03-12' --> 'data\processed_data\GD\4_2025-03-12.md'


2025-11-14 16:41:47,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,024 - INFO - Going to convert document batch...
2025-11-14 16:41:47,024 - INFO - Processing document 4_2025-03-20
2025-11-14 16:41:47,125 - INFO - Finished converting document 4_2025-03-20 in 0.14 sec.
2025-11-14 16:41:47,228 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:41:47,230 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:41

Converted 'data\edgar_documents\GD\4_2025-03-20' --> 'data\processed_data\GD\4_2025-03-20.md'
Error processing data\edgar_documents\GD\4_2025-04-28: File format not allowed: data\edgar_documents\GD\4_2025-04-28
Error processing data\edgar_documents\GD\4_2025-04-30: File format not allowed: data\edgar_documents\GD\4_2025-04-30
Converted 'data\edgar_documents\GD\4_2025-05-07' --> 'data\processed_data\GD\4_2025-05-07.md'


2025-11-14 16:41:47,361 - INFO - Going to convert document batch...
2025-11-14 16:41:47,362 - INFO - Processing document 4_2025-05-15
2025-11-14 16:41:47,406 - INFO - Finished converting document 4_2025-05-15 in 0.08 sec.
2025-11-14 16:41:47,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,462 - INFO - Going to convert document batch...
2025-11-14 16:41:47,463 - INFO - Processing document 4_2025-06-17
2025-11-14 16:41:47,496 - INFO - Finished converting document 4_2025-06-17 in 0.06 sec.
2025-11-14 16:41:47,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,568 - INFO - Going to convert document batch...
2025-11-14 16:41:47,569 - INFO - Processing document 4_2025-06-20
2025-11-14 16:41:47,610 - INFO - Finished converting document 4_2025-06-20 in 0.09 sec.
2025-11-14 16:41:47,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2025-05-15' --> 'data\processed_data\GD\4_2025-05-15.md'
Converted 'data\edgar_documents\GD\4_2025-06-17' --> 'data\processed_data\GD\4_2025-06-17.md'
Converted 'data\edgar_documents\GD\4_2025-06-20' --> 'data\processed_data\GD\4_2025-06-20.md'


2025-11-14 16:41:47,657 - INFO - Going to convert document batch...
2025-11-14 16:41:47,658 - INFO - Processing document 4_2025-07-29
2025-11-14 16:41:47,686 - INFO - Finished converting document 4_2025-07-29 in 0.06 sec.
2025-11-14 16:41:47,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,750 - INFO - Going to convert document batch...
2025-11-14 16:41:47,751 - INFO - Processing document 4_2025-08-06
2025-11-14 16:41:47,787 - INFO - Finished converting document 4_2025-08-06 in 0.08 sec.
2025-11-14 16:41:47,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,862 - INFO - Going to convert document batch...
2025-11-14 16:41:47,863 - INFO - Processing document 4_2025-08-12
2025-11-14 16:41:47,891 - INFO - Finished converting document 4_2025-08-12 in 0.08 sec.


Converted 'data\edgar_documents\GD\4_2025-07-29' --> 'data\processed_data\GD\4_2025-07-29.md'
Converted 'data\edgar_documents\GD\4_2025-08-06' --> 'data\processed_data\GD\4_2025-08-06.md'


2025-11-14 16:41:47,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:47,948 - INFO - Going to convert document batch...
2025-11-14 16:41:47,949 - INFO - Processing document 4_2025-08-18
2025-11-14 16:41:47,984 - INFO - Finished converting document 4_2025-08-18 in 0.08 sec.
2025-11-14 16:41:48,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,046 - INFO - Going to convert document batch...
2025-11-14 16:41:48,047 - INFO - Processing document 4_2025-08-20
2025-11-14 16:41:48,076 - INFO - Finished converting document 4_2025-08-20 in 0.06 sec.


Converted 'data\edgar_documents\GD\4_2025-08-12' --> 'data\processed_data\GD\4_2025-08-12.md'
Converted 'data\edgar_documents\GD\4_2025-08-18' --> 'data\processed_data\GD\4_2025-08-18.md'


2025-11-14 16:41:48,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,142 - INFO - Going to convert document batch...
2025-11-14 16:41:48,197 - INFO - Processing document 4_2025-08-26
2025-11-14 16:41:48,250 - INFO - Finished converting document 4_2025-08-26 in 0.16 sec.


Converted 'data\edgar_documents\GD\4_2025-08-20' --> 'data\processed_data\GD\4_2025-08-20.md'
Converted 'data\edgar_documents\GD\4_2025-08-26' --> 'data\processed_data\GD\4_2025-08-26.md'


2025-11-14 16:41:48,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,345 - INFO - Going to convert document batch...
2025-11-14 16:41:48,346 - INFO - Processing document 4_2025-08-27
2025-11-14 16:41:48,373 - INFO - Finished converting document 4_2025-08-27 in 0.09 sec.
2025-11-14 16:41:48,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,427 - INFO - Going to convert document batch...
2025-11-14 16:41:48,428 - INFO - Processing document 4_2025-09-08
2025-11-14 16:41:48,448 - INFO - Finished converting document 4_2025-09-08 in 0.05 sec.
2025-11-14 16:41:48,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,493 - INFO - Going to convert document batch...
2025-11-14 16:41:48,494 - INFO - Processing document 4_2025-09-10
2025-11-14 16:41:48,514 - INFO - Finished converting document 4_2025-09-10 in 0.05 sec.
2025-11-14 16:41:48,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GD\4_2025-08-27' --> 'data\processed_data\GD\4_2025-08-27.md'
Converted 'data\edgar_documents\GD\4_2025-09-08' --> 'data\processed_data\GD\4_2025-09-08.md'
Converted 'data\edgar_documents\GD\4_2025-09-10' --> 'data\processed_data\GD\4_2025-09-10.md'


2025-11-14 16:41:48,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,642 - INFO - Going to convert document batch...
2025-11-14 16:41:48,679 - INFO - Processing document 4_2025-09-18
2025-11-14 16:41:48,746 - INFO - Finished converting document 4_2025-09-18 in 0.14 sec.
2025-11-14 16:41:48,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2025-09-16' --> 'data\processed_data\GD\4_2025-09-16.md'
Converted 'data\edgar_documents\GD\4_2025-09-18' --> 'data\processed_data\GD\4_2025-09-18.md'


2025-11-14 16:41:48,807 - INFO - Going to convert document batch...
2025-11-14 16:41:48,808 - INFO - Processing document 4_2025-10-30
2025-11-14 16:41:48,843 - INFO - Finished converting document 4_2025-10-30 in 0.08 sec.
2025-11-14 16:41:48,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:48,897 - INFO - Going to convert document batch...
2025-11-14 16:41:48,897 - INFO - Processing document 4_2025-11-07


Converted 'data\edgar_documents\GD\4_2025-10-30' --> 'data\processed_data\GD\4_2025-10-30.md'


2025-11-14 16:41:49,390 - INFO - Finished converting document 4_2025-11-07 in 0.52 sec.
2025-11-14 16:41:49,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:49,485 - INFO - Going to convert document batch...
2025-11-14 16:41:49,486 - INFO - Processing document 8-K_2023-01-25
2025-11-14 16:41:49,507 - INFO - Finished converting document 8-K_2023-01-25 in 0.09 sec.
2025-11-14 16:41:49,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:49,547 - INFO - Going to convert document batch...
2025-11-14 16:41:49,548 - INFO - Processing document 8-K_2023-02-06
2025-11-14 16:41:49,566 - INFO - Finished converting document 8-K_2023-02-06 in 0.05 sec.
2025-11-14 16:41:49,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\4_2025-11-07' --> 'data\processed_data\GD\4_2025-11-07.md'
Converted 'data\edgar_documents\GD\8-K_2023-01-25' --> 'data\processed_data\GD\8-K_2023-01-25.md'
Converted 'data\edgar_documents\GD\8-K_2023-02-06' --> 'data\processed_data\GD\8-K_2023-02-06.md'


2025-11-14 16:41:49,611 - INFO - Going to convert document batch...
2025-11-14 16:41:49,612 - INFO - Processing document 8-K_2023-04-26
2025-11-14 16:41:49,710 - INFO - Finished converting document 8-K_2023-04-26 in 0.12 sec.
2025-11-14 16:41:49,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:49,820 - INFO - Going to convert document batch...
2025-11-14 16:41:49,822 - INFO - Processing document 8-K_2023-05-05
2025-11-14 16:41:49,886 - INFO - Finished converting document 8-K_2023-05-05 in 0.16 sec.


Converted 'data\edgar_documents\GD\8-K_2023-04-26' --> 'data\processed_data\GD\8-K_2023-04-26.md'


2025-11-14 16:41:49,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:49,988 - INFO - Going to convert document batch...
2025-11-14 16:41:49,989 - INFO - Processing document 8-K_2023-06-08
2025-11-14 16:41:50,008 - INFO - Finished converting document 8-K_2023-06-08 in 0.08 sec.
2025-11-14 16:41:50,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,055 - INFO - Going to convert document batch...
2025-11-14 16:41:50,056 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:41:50,076 - INFO - Finished converting document 8-K_2023-07-26 in 0.05 sec.
2025-11-14 16:41:50,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2023-05-05' --> 'data\processed_data\GD\8-K_2023-05-05.md'
Converted 'data\edgar_documents\GD\8-K_2023-06-08' --> 'data\processed_data\GD\8-K_2023-06-08.md'
Converted 'data\edgar_documents\GD\8-K_2023-07-26' --> 'data\processed_data\GD\8-K_2023-07-26.md'


2025-11-14 16:41:50,134 - INFO - Going to convert document batch...
2025-11-14 16:41:50,135 - INFO - Processing document 8-K_2023-08-30
2025-11-14 16:41:50,177 - INFO - Finished converting document 8-K_2023-08-30 in 0.08 sec.
2025-11-14 16:41:50,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,316 - INFO - Going to convert document batch...
2025-11-14 16:41:50,317 - INFO - Processing document 8-K_2023-10-05
2025-11-14 16:41:50,335 - INFO - Finished converting document 8-K_2023-10-05 in 0.14 sec.
2025-11-14 16:41:50,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2023-08-30' --> 'data\processed_data\GD\8-K_2023-08-30.md'
Converted 'data\edgar_documents\GD\8-K_2023-10-05' --> 'data\processed_data\GD\8-K_2023-10-05.md'


2025-11-14 16:41:50,401 - INFO - Going to convert document batch...
2025-11-14 16:41:50,402 - INFO - Processing document 8-K_2023-10-25
2025-11-14 16:41:50,426 - INFO - Finished converting document 8-K_2023-10-25 in 0.08 sec.
2025-11-14 16:41:50,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,475 - INFO - Going to convert document batch...
2025-11-14 16:41:50,476 - INFO - Processing document 8-K_2024-01-05
2025-11-14 16:41:50,498 - INFO - Finished converting document 8-K_2024-01-05 in 0.06 sec.
2025-11-14 16:41:50,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,553 - INFO - Going to convert document batch...
2025-11-14 16:41:50,554 - INFO - Processing document 8-K_2024-01-24
2025-11-14 16:41:50,572 - INFO - Finished converting document 8-K_2024-01-24 in 0.05 sec.
2025-11-14 16:41:50,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,608 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GD\8-K_2023-10-25' --> 'data\processed_data\GD\8-K_2023-10-25.md'
Converted 'data\edgar_documents\GD\8-K_2024-01-05' --> 'data\processed_data\GD\8-K_2024-01-05.md'
Converted 'data\edgar_documents\GD\8-K_2024-01-24' --> 'data\processed_data\GD\8-K_2024-01-24.md'


2025-11-14 16:41:50,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,663 - INFO - Going to convert document batch...
2025-11-14 16:41:50,664 - INFO - Processing document 8-K_2024-03-07
2025-11-14 16:41:50,689 - INFO - Finished converting document 8-K_2024-03-07 in 0.05 sec.
2025-11-14 16:41:50,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,792 - INFO - Going to convert document batch...
2025-11-14 16:41:50,793 - INFO - Processing document 8-K_2024-04-24
2025-11-14 16:41:50,823 - INFO - Finished converting document 8-K_2024-04-24 in 0.12 sec.


Converted 'data\edgar_documents\GD\8-K_2024-02-13' --> 'data\processed_data\GD\8-K_2024-02-13.md'
Converted 'data\edgar_documents\GD\8-K_2024-03-07' --> 'data\processed_data\GD\8-K_2024-03-07.md'


2025-11-14 16:41:50,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:50,892 - INFO - Going to convert document batch...
2025-11-14 16:41:50,893 - INFO - Processing document 8-K_2024-05-03
2025-11-14 16:41:50,939 - INFO - Finished converting document 8-K_2024-05-03 in 0.11 sec.
2025-11-14 16:41:51,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2024-04-24' --> 'data\processed_data\GD\8-K_2024-04-24.md'
Converted 'data\edgar_documents\GD\8-K_2024-05-03' --> 'data\processed_data\GD\8-K_2024-05-03.md'


2025-11-14 16:41:51,043 - INFO - Going to convert document batch...
2025-11-14 16:41:51,045 - INFO - Processing document 8-K_2024-07-24
2025-11-14 16:41:51,067 - INFO - Finished converting document 8-K_2024-07-24 in 0.09 sec.
2025-11-14 16:41:51,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,118 - INFO - Going to convert document batch...
2025-11-14 16:41:51,173 - INFO - Processing document 8-K_2024-08-08
2025-11-14 16:41:51,231 - INFO - Finished converting document 8-K_2024-08-08 in 0.16 sec.
2025-11-14 16:41:51,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2024-07-24' --> 'data\processed_data\GD\8-K_2024-07-24.md'
Converted 'data\edgar_documents\GD\8-K_2024-08-08' --> 'data\processed_data\GD\8-K_2024-08-08.md'


2025-11-14 16:41:51,301 - INFO - Going to convert document batch...
2025-11-14 16:41:51,302 - INFO - Processing document 8-K_2024-10-23
2025-11-14 16:41:51,334 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.
2025-11-14 16:41:51,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,374 - INFO - Going to convert document batch...
2025-11-14 16:41:51,375 - INFO - Processing document 8-K_2024-12-16
2025-11-14 16:41:51,392 - INFO - Finished converting document 8-K_2024-12-16 in 0.05 sec.
2025-11-14 16:41:51,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,427 - INFO - Going to convert document batch...
2025-11-14 16:41:51,430 - INFO - Processing document 8-K_2025-01-29
2025-11-14 16:41:51,451 - INFO - Finished converting document 8-K_2025-01-29 in 0.05 sec.
2025-11-14 16:41:51,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,493 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GD\8-K_2024-10-23' --> 'data\processed_data\GD\8-K_2024-10-23.md'
Converted 'data\edgar_documents\GD\8-K_2024-12-16' --> 'data\processed_data\GD\8-K_2024-12-16.md'
Converted 'data\edgar_documents\GD\8-K_2025-01-29' --> 'data\processed_data\GD\8-K_2025-01-29.md'


2025-11-14 16:41:51,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,554 - INFO - Going to convert document batch...
2025-11-14 16:41:51,555 - INFO - Processing document 8-K_2025-05-07
2025-11-14 16:41:51,580 - INFO - Finished converting document 8-K_2025-05-07 in 0.05 sec.
2025-11-14 16:41:51,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2025-04-23' --> 'data\processed_data\GD\8-K_2025-04-23.md'
Converted 'data\edgar_documents\GD\8-K_2025-05-07' --> 'data\processed_data\GD\8-K_2025-05-07.md'


2025-11-14 16:41:51,744 - INFO - Going to convert document batch...
2025-11-14 16:41:51,745 - INFO - Processing document 8-K_2025-05-09
2025-11-14 16:41:51,807 - INFO - Finished converting document 8-K_2025-05-09 in 0.22 sec.
2025-11-14 16:41:51,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,908 - INFO - Going to convert document batch...
2025-11-14 16:41:51,908 - INFO - Processing document 8-K_2025-06-04
2025-11-14 16:41:51,926 - INFO - Finished converting document 8-K_2025-06-04 in 0.08 sec.
2025-11-14 16:41:51,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:51,969 - INFO - Going to convert document batch...
2025-11-14 16:41:51,969 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:41:51,986 - INFO - Finished converting document 8-K_2025-06-09 in 0.05 sec.
2025-11-14 16:41:52,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:52,023 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GD\8-K_2025-05-09' --> 'data\processed_data\GD\8-K_2025-05-09.md'
Converted 'data\edgar_documents\GD\8-K_2025-06-04' --> 'data\processed_data\GD\8-K_2025-06-04.md'
Converted 'data\edgar_documents\GD\8-K_2025-06-09' --> 'data\processed_data\GD\8-K_2025-06-09.md'


2025-11-14 16:41:52,048 - INFO - Finished converting document 8-K_2025-07-23 in 0.05 sec.
2025-11-14 16:41:52,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:41:52,100 - INFO - Going to convert document batch...
2025-11-14 16:41:52,101 - INFO - Processing document 8-K_2025-10-24
2025-11-14 16:41:52,126 - INFO - Finished converting document 8-K_2025-10-24 in 0.06 sec.
2025-11-14 16:41:52,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\8-K_2025-07-23' --> 'data\processed_data\GD\8-K_2025-07-23.md'
Converted 'data\edgar_documents\GD\8-K_2025-10-24' --> 'data\processed_data\GD\8-K_2025-10-24.md'


2025-11-14 16:41:53,042 - INFO - Going to convert document batch...
2025-11-14 16:41:53,042 - INFO - Processing document DEF-14A_2023-03-24
2025-11-14 16:41:54,733 - INFO - Finished converting document DEF-14A_2023-03-24 in 2.59 sec.
2025-11-14 16:41:55,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GD\DEF-14A_2023-03-24' --> 'data\processed_data\GD\DEF-14A_2023-03-24.md'


2025-11-14 16:41:56,607 - INFO - Going to convert document batch...
2025-11-14 16:41:56,608 - INFO - Processing document DEF-14A_2024-03-22
2025-11-14 16:41:58,154 - INFO - Finished converting document DEF-14A_2024-03-22 in 2.53 sec.


Converted 'data\edgar_documents\GD\DEF-14A_2024-03-22' --> 'data\processed_data\GD\DEF-14A_2024-03-22.md'


2025-11-14 16:41:59,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:42:00,497 - INFO - Going to convert document batch...
2025-11-14 16:42:00,498 - INFO - Processing document DEF-14A_2025-03-28
2025-11-14 16:42:12,453 - INFO - Finished converting document DEF-14A_2025-03-28 in 13.22 sec.


Converted 'data\edgar_documents\GD\DEF-14A_2025-03-28' --> 'data\processed_data\GD\DEF-14A_2025-03-28.md'
Processed 104 new files. Errors: 2
Found 106 files to process in data\edgar_documents\GE


2025-11-14 16:42:14,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:42:16,453 - INFO - Going to convert document batch...
2025-11-14 16:42:16,454 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:42:16,455 - INFO - Processing document 10-K_2023-02-10
2025-11-14 16:42:19,833 - INFO - Finished converting document 10-K_2023-02-10 in 5.97 sec.
2025-11-14 16:42:21,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-K_2023-02-10' --> 'data\processed_data\GE\10-K_2023-02-10.md'


2025-11-14 16:42:22,952 - INFO - Going to convert document batch...
2025-11-14 16:42:22,953 - INFO - Processing document 10-K_2024-02-02
2025-11-14 16:42:26,354 - INFO - Finished converting document 10-K_2024-02-02 in 5.11 sec.
2025-11-14 16:42:27,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-K_2024-02-02' --> 'data\processed_data\GE\10-K_2024-02-02.md'


2025-11-14 16:42:29,668 - INFO - Going to convert document batch...
2025-11-14 16:42:29,669 - INFO - Processing document 10-K_2025-02-03
2025-11-14 16:42:32,570 - INFO - Finished converting document 10-K_2025-02-03 in 4.78 sec.
2025-11-14 16:42:33,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-K_2025-02-03' --> 'data\processed_data\GE\10-K_2025-02-03.md'


2025-11-14 16:42:35,440 - INFO - Going to convert document batch...
2025-11-14 16:42:35,443 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 16:42:37,103 - INFO - Finished converting document 10-Q_2023-04-25 in 3.30 sec.
2025-11-14 16:42:38,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2023-04-25' --> 'data\processed_data\GE\10-Q_2023-04-25.md'


2025-11-14 16:42:39,791 - INFO - Going to convert document batch...
2025-11-14 16:42:39,792 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 16:42:41,405 - INFO - Finished converting document 10-Q_2023-07-25 in 3.33 sec.
2025-11-14 16:42:42,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2023-07-25' --> 'data\processed_data\GE\10-Q_2023-07-25.md'


2025-11-14 16:42:43,890 - INFO - Going to convert document batch...
2025-11-14 16:42:43,892 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 16:42:45,776 - INFO - Finished converting document 10-Q_2023-10-24 in 3.22 sec.
2025-11-14 16:42:46,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2023-10-24' --> 'data\processed_data\GE\10-Q_2023-10-24.md'


2025-11-14 16:42:47,581 - INFO - Going to convert document batch...
2025-11-14 16:42:47,582 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 16:42:49,287 - INFO - Finished converting document 10-Q_2024-04-23 in 2.44 sec.
2025-11-14 16:42:50,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2024-04-23' --> 'data\processed_data\GE\10-Q_2024-04-23.md'


2025-11-14 16:42:50,863 - INFO - Going to convert document batch...
2025-11-14 16:42:50,864 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 16:42:52,131 - INFO - Finished converting document 10-Q_2024-07-23 in 2.02 sec.
2025-11-14 16:42:53,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2024-07-23' --> 'data\processed_data\GE\10-Q_2024-07-23.md'


2025-11-14 16:42:54,200 - INFO - Going to convert document batch...
2025-11-14 16:42:54,202 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 16:42:55,326 - INFO - Finished converting document 10-Q_2024-10-22 in 2.33 sec.
2025-11-14 16:42:56,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2024-10-22' --> 'data\processed_data\GE\10-Q_2024-10-22.md'


2025-11-14 16:42:57,032 - INFO - Going to convert document batch...
2025-11-14 16:42:57,033 - INFO - Processing document 10-Q_2025-04-22
2025-11-14 16:42:57,865 - INFO - Finished converting document 10-Q_2025-04-22 in 1.38 sec.
2025-11-14 16:42:58,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2025-04-22' --> 'data\processed_data\GE\10-Q_2025-04-22.md'


2025-11-14 16:42:59,542 - INFO - Going to convert document batch...
2025-11-14 16:42:59,542 - INFO - Processing document 10-Q_2025-07-21
2025-11-14 16:43:00,678 - INFO - Finished converting document 10-Q_2025-07-21 in 2.16 sec.
2025-11-14 16:43:01,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\10-Q_2025-07-21' --> 'data\processed_data\GE\10-Q_2025-07-21.md'


2025-11-14 16:43:02,906 - INFO - Going to convert document batch...
2025-11-14 16:43:02,906 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 16:43:03,975 - INFO - Finished converting document 10-Q_2025-10-21 in 2.28 sec.
2025-11-14 16:43:04,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:04,972 - INFO - Going to convert document batch...
2025-11-14 16:43:04,972 - INFO - Processing document 4_2023-01-05
2025-11-14 16:43:04,999 - INFO - Finished converting document 4_2023-01-05 in 0.05 sec.
2025-11-14 16:43:05,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,059 - INFO - Going to convert document batch...
2025-11-14 16:43:05,059 - INFO - Processing document 4_2023-03-02
2025-11-14 16:43:05,089 - INFO - Finished converting document 4_2023-03-02 in 0.06 sec.


Converted 'data\edgar_documents\GE\10-Q_2025-10-21' --> 'data\processed_data\GE\10-Q_2025-10-21.md'
Converted 'data\edgar_documents\GE\4_2023-01-05' --> 'data\processed_data\GE\4_2023-01-05.md'


2025-11-14 16:43:05,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,167 - INFO - Going to convert document batch...
2025-11-14 16:43:05,168 - INFO - Processing document 4_2023-03-06
2025-11-14 16:43:05,194 - INFO - Finished converting document 4_2023-03-06 in 0.05 sec.
2025-11-14 16:43:05,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,252 - INFO - Going to convert document batch...
2025-11-14 16:43:05,253 - INFO - Processing document 4_2023-04-04
2025-11-14 16:43:05,293 - INFO - Finished converting document 4_2023-04-04 in 0.08 sec.


Converted 'data\edgar_documents\GE\4_2023-03-02' --> 'data\processed_data\GE\4_2023-03-02.md'
Converted 'data\edgar_documents\GE\4_2023-03-06' --> 'data\processed_data\GE\4_2023-03-06.md'
Converted 'data\edgar_documents\GE\4_2023-04-04' --> 'data\processed_data\GE\4_2023-04-04.md'


2025-11-14 16:43:05,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,366 - INFO - Going to convert document batch...
2025-11-14 16:43:05,367 - INFO - Processing document 4_2023-04-11
2025-11-14 16:43:05,408 - INFO - Finished converting document 4_2023-04-11 in 0.08 sec.
2025-11-14 16:43:05,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,469 - INFO - Going to convert document batch...
2025-11-14 16:43:05,471 - INFO - Processing document 4_2023-05-03
2025-11-14 16:43:05,498 - INFO - Finished converting document 4_2023-05-03 in 0.06 sec.
2025-11-14 16:43:05,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,567 - INFO - Going to convert document batch...
2025-11-14 16:43:05,567 - INFO - Processing document 4_2023-05-12
2025-11-14 16:43:05,608 - INFO - Finished converting document 4_2023-05-12 in 0.08 sec.


Converted 'data\edgar_documents\GE\4_2023-04-11' --> 'data\processed_data\GE\4_2023-04-11.md'
Converted 'data\edgar_documents\GE\4_2023-05-03' --> 'data\processed_data\GE\4_2023-05-03.md'


2025-11-14 16:43:05,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,672 - INFO - Going to convert document batch...
2025-11-14 16:43:05,674 - INFO - Processing document 4_2023-05-24
2025-11-14 16:43:05,706 - INFO - Finished converting document 4_2023-05-24 in 0.06 sec.
2025-11-14 16:43:05,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,790 - INFO - Going to convert document batch...
2025-11-14 16:43:05,791 - INFO - Processing document 4_2023-06-12
2025-11-14 16:43:05,814 - INFO - Finished converting document 4_2023-06-12 in 0.06 sec.


Converted 'data\edgar_documents\GE\4_2023-05-12' --> 'data\processed_data\GE\4_2023-05-12.md'
Converted 'data\edgar_documents\GE\4_2023-05-24' --> 'data\processed_data\GE\4_2023-05-24.md'


2025-11-14 16:43:05,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:05,869 - INFO - Going to convert document batch...
2025-11-14 16:43:05,870 - INFO - Processing document 4_2023-06-14
2025-11-14 16:43:05,970 - INFO - Finished converting document 4_2023-06-14 in 0.12 sec.


Converted 'data\edgar_documents\GE\4_2023-06-12' --> 'data\processed_data\GE\4_2023-06-12.md'
Converted 'data\edgar_documents\GE\4_2023-06-14' --> 'data\processed_data\GE\4_2023-06-14.md'


2025-11-14 16:43:06,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,079 - INFO - Going to convert document batch...
2025-11-14 16:43:06,080 - INFO - Processing document 4_2023-06-23
2025-11-14 16:43:06,112 - INFO - Finished converting document 4_2023-06-23 in 0.09 sec.
2025-11-14 16:43:06,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,167 - INFO - Going to convert document batch...
2025-11-14 16:43:06,168 - INFO - Processing document 4_2023-07-05
2025-11-14 16:43:06,200 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 16:43:06,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,277 - INFO - Going to convert document batch...
2025-11-14 16:43:06,279 - INFO - Processing document 4_2023-07-31
2025-11-14 16:43:06,302 - INFO - Finished converting document 4_2023-07-31 in 0.06 sec.


Converted 'data\edgar_documents\GE\4_2023-06-23' --> 'data\processed_data\GE\4_2023-06-23.md'
Converted 'data\edgar_documents\GE\4_2023-07-05' --> 'data\processed_data\GE\4_2023-07-05.md'
Converted 'data\edgar_documents\GE\4_2023-07-31' --> 'data\processed_data\GE\4_2023-07-31.md'


2025-11-14 16:43:06,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,400 - INFO - Going to convert document batch...
2025-11-14 16:43:06,401 - INFO - Processing document 4_2023-09-06
2025-11-14 16:43:06,446 - INFO - Finished converting document 4_2023-09-06 in 0.09 sec.
2025-11-14 16:43:06,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,526 - INFO - Going to convert document batch...
2025-11-14 16:43:06,528 - INFO - Processing document 4_2023-10-03
2025-11-14 16:43:06,605 - INFO - Finished converting document 4_2023-10-03 in 0.12 sec.


Converted 'data\edgar_documents\GE\4_2023-09-06' --> 'data\processed_data\GE\4_2023-09-06.md'
Converted 'data\edgar_documents\GE\4_2023-10-03' --> 'data\processed_data\GE\4_2023-10-03.md'


2025-11-14 16:43:06,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,722 - INFO - Going to convert document batch...
2025-11-14 16:43:06,723 - INFO - Processing document 4_2023-11-21
2025-11-14 16:43:06,752 - INFO - Finished converting document 4_2023-11-21 in 0.09 sec.
2025-11-14 16:43:06,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,800 - INFO - Going to convert document batch...
2025-11-14 16:43:06,800 - INFO - Processing document 4_2024-01-03
2025-11-14 16:43:06,823 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 16:43:06,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:06,869 - INFO - Going to convert document batch...
2025-11-14 16:43:06,870 - INFO - Processing document 4_2024-02-05
2025-11-14 16:43:06,890 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 16:43:06,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GE\4_2023-11-21' --> 'data\processed_data\GE\4_2023-11-21.md'
Converted 'data\edgar_documents\GE\4_2024-01-03' --> 'data\processed_data\GE\4_2024-01-03.md'
Converted 'data\edgar_documents\GE\4_2024-02-05' --> 'data\processed_data\GE\4_2024-02-05.md'


2025-11-14 16:43:07,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,015 - INFO - Going to convert document batch...
2025-11-14 16:43:07,016 - INFO - Processing document 4_2024-02-21
2025-11-14 16:43:07,097 - INFO - Finished converting document 4_2024-02-21 in 0.11 sec.
2025-11-14 16:43:07,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2024-02-16' --> 'data\processed_data\GE\4_2024-02-16.md'
Converted 'data\edgar_documents\GE\4_2024-02-21' --> 'data\processed_data\GE\4_2024-02-21.md'


2025-11-14 16:43:07,210 - INFO - Going to convert document batch...
2025-11-14 16:43:07,212 - INFO - Processing document 4_2024-02-27
2025-11-14 16:43:07,256 - INFO - Finished converting document 4_2024-02-27 in 0.11 sec.
2025-11-14 16:43:07,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,350 - INFO - Going to convert document batch...
2025-11-14 16:43:07,351 - INFO - Processing document 4_2024-03-05
2025-11-14 16:43:07,387 - INFO - Finished converting document 4_2024-03-05 in 0.09 sec.
2025-11-14 16:43:07,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,438 - INFO - Going to convert document batch...
2025-11-14 16:43:07,439 - INFO - Processing document 4_2024-03-15
2025-11-14 16:43:07,459 - INFO - Finished converting document 4_2024-03-15 in 0.03 sec.


Converted 'data\edgar_documents\GE\4_2024-02-27' --> 'data\processed_data\GE\4_2024-02-27.md'
Converted 'data\edgar_documents\GE\4_2024-03-05' --> 'data\processed_data\GE\4_2024-03-05.md'
Converted 'data\edgar_documents\GE\4_2024-03-15' --> 'data\processed_data\GE\4_2024-03-15.md'


2025-11-14 16:43:07,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,523 - INFO - Going to convert document batch...
2025-11-14 16:43:07,524 - INFO - Processing document 4_2024-04-01
2025-11-14 16:43:07,550 - INFO - Finished converting document 4_2024-04-01 in 0.06 sec.
2025-11-14 16:43:07,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,605 - INFO - Going to convert document batch...
2025-11-14 16:43:07,606 - INFO - Processing document 4_2024-04-04
2025-11-14 16:43:07,625 - INFO - Finished converting document 4_2024-04-04 in 0.05 sec.
2025-11-14 16:43:07,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,669 - INFO - Going to convert document batch...
2025-11-14 16:43:07,669 - INFO - Processing document 4_2024-05-03
2025-11-14 16:43:07,691 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.
2025-11-14 16:43:07,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GE\4_2024-04-01' --> 'data\processed_data\GE\4_2024-04-01.md'
Converted 'data\edgar_documents\GE\4_2024-04-04' --> 'data\processed_data\GE\4_2024-04-04.md'
Converted 'data\edgar_documents\GE\4_2024-05-03' --> 'data\processed_data\GE\4_2024-05-03.md'


2025-11-14 16:43:07,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,816 - INFO - Going to convert document batch...
2025-11-14 16:43:07,817 - INFO - Processing document 4_2024-05-23
2025-11-14 16:43:07,840 - INFO - Finished converting document 4_2024-05-23 in 0.06 sec.
2025-11-14 16:43:07,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:07,895 - INFO - Going to convert document batch...
2025-11-14 16:43:07,898 - INFO - Processing document 4_2024-05-24
2025-11-14 16:43:07,930 - INFO - Finished converting document 4_2024-05-24 in 0.05 sec.
2025-11-14 16:43:07,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2024-05-08' --> 'data\processed_data\GE\4_2024-05-08.md'
Converted 'data\edgar_documents\GE\4_2024-05-23' --> 'data\processed_data\GE\4_2024-05-23.md'
Converted 'data\edgar_documents\GE\4_2024-05-24' --> 'data\processed_data\GE\4_2024-05-24.md'


2025-11-14 16:43:07,980 - INFO - Going to convert document batch...
2025-11-14 16:43:07,980 - INFO - Processing document 4_2024-07-02
2025-11-14 16:43:08,092 - INFO - Finished converting document 4_2024-07-02 in 0.14 sec.
2025-11-14 16:43:08,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,191 - INFO - Going to convert document batch...
2025-11-14 16:43:08,193 - INFO - Processing document 4_2024-08-06
2025-11-14 16:43:08,221 - INFO - Finished converting document 4_2024-08-06 in 0.09 sec.
2025-11-14 16:43:08,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,269 - INFO - Going to convert document batch...
2025-11-14 16:43:08,270 - INFO - Processing document 4_2024-08-20
2025-11-14 16:43:08,295 - INFO - Finished converting document 4_2024-08-20 in 0.05 sec.


Converted 'data\edgar_documents\GE\4_2024-07-02' --> 'data\processed_data\GE\4_2024-07-02.md'
Converted 'data\edgar_documents\GE\4_2024-08-06' --> 'data\processed_data\GE\4_2024-08-06.md'


2025-11-14 16:43:08,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,346 - INFO - Going to convert document batch...
2025-11-14 16:43:08,348 - INFO - Processing document 4_2024-09-04
2025-11-14 16:43:08,386 - INFO - Finished converting document 4_2024-09-04 in 0.08 sec.
2025-11-14 16:43:08,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,440 - INFO - Going to convert document batch...
2025-11-14 16:43:08,441 - INFO - Processing document 4_2024-09-05
2025-11-14 16:43:08,466 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 16:43:08,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2024-08-20' --> 'data\processed_data\GE\4_2024-08-20.md'
Converted 'data\edgar_documents\GE\4_2024-09-04' --> 'data\processed_data\GE\4_2024-09-04.md'
Converted 'data\edgar_documents\GE\4_2024-09-05' --> 'data\processed_data\GE\4_2024-09-05.md'


2025-11-14 16:43:08,512 - INFO - Going to convert document batch...
2025-11-14 16:43:08,514 - INFO - Processing document 4_2024-10-02
2025-11-14 16:43:08,641 - INFO - Finished converting document 4_2024-10-02 in 0.16 sec.
2025-11-14 16:43:08,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,738 - INFO - Going to convert document batch...
2025-11-14 16:43:08,739 - INFO - Processing document 4_2024-11-07
2025-11-14 16:43:08,765 - INFO - Finished converting document 4_2024-11-07 in 0.09 sec.
2025-11-14 16:43:08,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,811 - INFO - Going to convert document batch...
2025-11-14 16:43:08,811 - INFO - Processing document 4_2024-11-20
2025-11-14 16:43:08,838 - INFO - Finished converting document 4_2024-11-20 in 0.05 sec.


Converted 'data\edgar_documents\GE\4_2024-10-02' --> 'data\processed_data\GE\4_2024-10-02.md'
Converted 'data\edgar_documents\GE\4_2024-11-07' --> 'data\processed_data\GE\4_2024-11-07.md'


2025-11-14 16:43:08,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,903 - INFO - Going to convert document batch...
2025-11-14 16:43:08,904 - INFO - Processing document 4_2024-11-25
2025-11-14 16:43:08,944 - INFO - Finished converting document 4_2024-11-25 in 0.06 sec.
2025-11-14 16:43:08,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:08,988 - INFO - Going to convert document batch...
2025-11-14 16:43:08,989 - INFO - Processing document 4_2025-01-03
2025-11-14 16:43:09,008 - INFO - Finished converting document 4_2025-01-03 in 0.03 sec.
2025-11-14 16:43:09,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2024-11-20' --> 'data\processed_data\GE\4_2024-11-20.md'
Converted 'data\edgar_documents\GE\4_2024-11-25' --> 'data\processed_data\GE\4_2024-11-25.md'
Converted 'data\edgar_documents\GE\4_2025-01-03' --> 'data\processed_data\GE\4_2025-01-03.md'


2025-11-14 16:43:09,068 - INFO - Going to convert document batch...
2025-11-14 16:43:09,069 - INFO - Processing document 4_2025-01-08
2025-11-14 16:43:09,099 - INFO - Finished converting document 4_2025-01-08 in 0.06 sec.
2025-11-14 16:43:09,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,151 - INFO - Going to convert document batch...
2025-11-14 16:43:09,152 - INFO - Processing document 4_2025-02-25
2025-11-14 16:43:09,175 - INFO - Finished converting document 4_2025-02-25 in 0.05 sec.
2025-11-14 16:43:09,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,238 - INFO - Going to convert document batch...
2025-11-14 16:43:09,239 - INFO - Processing document 4_2025-03-04
2025-11-14 16:43:09,268 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.
2025-11-14 16:43:09,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2025-01-08' --> 'data\processed_data\GE\4_2025-01-08.md'
Converted 'data\edgar_documents\GE\4_2025-02-25' --> 'data\processed_data\GE\4_2025-02-25.md'
Converted 'data\edgar_documents\GE\4_2025-03-04' --> 'data\processed_data\GE\4_2025-03-04.md'


2025-11-14 16:43:09,320 - INFO - Going to convert document batch...
2025-11-14 16:43:09,321 - INFO - Processing document 4_2025-03-05
2025-11-14 16:43:09,348 - INFO - Finished converting document 4_2025-03-05 in 0.05 sec.
2025-11-14 16:43:09,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,403 - INFO - Going to convert document batch...
2025-11-14 16:43:09,404 - INFO - Processing document 4_2025-04-02
2025-11-14 16:43:09,423 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 16:43:09,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,471 - INFO - Going to convert document batch...
2025-11-14 16:43:09,472 - INFO - Processing document 4_2025-04-28
2025-11-14 16:43:09,498 - INFO - Finished converting document 4_2025-04-28 in 0.05 sec.
2025-11-14 16:43:09,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,546 - INFO - Going to convert document batch...
2025-11-14 16:43:09,547 - 

Converted 'data\edgar_documents\GE\4_2025-03-05' --> 'data\processed_data\GE\4_2025-03-05.md'
Converted 'data\edgar_documents\GE\4_2025-04-02' --> 'data\processed_data\GE\4_2025-04-02.md'
Converted 'data\edgar_documents\GE\4_2025-04-28' --> 'data\processed_data\GE\4_2025-04-28.md'


2025-11-14 16:43:09,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,627 - INFO - Going to convert document batch...
2025-11-14 16:43:09,628 - INFO - Processing document 4_2025-05-07
2025-11-14 16:43:09,658 - INFO - Finished converting document 4_2025-05-07 in 0.05 sec.
2025-11-14 16:43:09,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2025-05-01' --> 'data\processed_data\GE\4_2025-05-01.md'
Converted 'data\edgar_documents\GE\4_2025-05-07' --> 'data\processed_data\GE\4_2025-05-07.md'


2025-11-14 16:43:09,814 - INFO - Going to convert document batch...
2025-11-14 16:43:09,827 - INFO - Processing document 4_2025-05-14
2025-11-14 16:43:09,859 - INFO - Finished converting document 4_2025-05-14 in 0.17 sec.
2025-11-14 16:43:09,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:09,957 - INFO - Going to convert document batch...
2025-11-14 16:43:09,958 - INFO - Processing document 4_2025-06-03
2025-11-14 16:43:09,996 - INFO - Finished converting document 4_2025-06-03 in 0.11 sec.
2025-11-14 16:43:10,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:10,053 - INFO - Going to convert document batch...
2025-11-14 16:43:10,054 - INFO - Processing document 4_2025-07-01
2025-11-14 16:43:10,075 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.


Converted 'data\edgar_documents\GE\4_2025-05-14' --> 'data\processed_data\GE\4_2025-05-14.md'
Converted 'data\edgar_documents\GE\4_2025-06-03' --> 'data\processed_data\GE\4_2025-06-03.md'


2025-11-14 16:43:10,125 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:43:10,127 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:43:10,128 - INFO - Going to convert document batch...
2025-11-14 16:43:10,153 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:43:10,154 - ERROR - Input document 4_2025-07-24 with format None does not match any allowed format: (dict_keys

Converted 'data\edgar_documents\GE\4_2025-07-01' --> 'data\processed_data\GE\4_2025-07-01.md'
Error processing data\edgar_documents\GE\4_2025-07-22: File format not allowed: data\edgar_documents\GE\4_2025-07-22
Error processing data\edgar_documents\GE\4_2025-07-24: File format not allowed: data\edgar_documents\GE\4_2025-07-24


2025-11-14 16:43:10,844 - INFO - Finished converting document 4_2025-08-06 in 0.69 sec.
2025-11-14 16:43:10,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:10,945 - INFO - Going to convert document batch...
2025-11-14 16:43:10,946 - INFO - Processing document 4_2025-09-03
2025-11-14 16:43:10,973 - INFO - Finished converting document 4_2025-09-03 in 0.08 sec.
2025-11-14 16:43:11,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,019 - INFO - Going to convert document batch...
2025-11-14 16:43:11,020 - INFO - Processing document 4_2025-10-02
2025-11-14 16:43:11,041 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 16:43:11,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\4_2025-08-06' --> 'data\processed_data\GE\4_2025-08-06.md'
Converted 'data\edgar_documents\GE\4_2025-09-03' --> 'data\processed_data\GE\4_2025-09-03.md'
Converted 'data\edgar_documents\GE\4_2025-10-02' --> 'data\processed_data\GE\4_2025-10-02.md'


2025-11-14 16:43:11,105 - INFO - Going to convert document batch...
2025-11-14 16:43:11,105 - INFO - Processing document 8-K_2023-01-04
2025-11-14 16:43:11,151 - INFO - Finished converting document 8-K_2023-01-04 in 0.09 sec.
2025-11-14 16:43:11,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,212 - INFO - Going to convert document batch...
2025-11-14 16:43:11,213 - INFO - Processing document 8-K_2023-01-09
2025-11-14 16:43:11,237 - INFO - Finished converting document 8-K_2023-01-09 in 0.06 sec.
2025-11-14 16:43:11,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,285 - INFO - Going to convert document batch...
2025-11-14 16:43:11,286 - INFO - Processing document 8-K_2023-01-10
2025-11-14 16:43:11,307 - INFO - Finished converting document 8-K_2023-01-10 in 0.05 sec.
2025-11-14 16:43:11,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,355 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GE\8-K_2023-01-04' --> 'data\processed_data\GE\8-K_2023-01-04.md'
Converted 'data\edgar_documents\GE\8-K_2023-01-09' --> 'data\processed_data\GE\8-K_2023-01-09.md'
Converted 'data\edgar_documents\GE\8-K_2023-01-10' --> 'data\processed_data\GE\8-K_2023-01-10.md'


2025-11-14 16:43:11,356 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:43:11,403 - INFO - Finished converting document 8-K_2023-01-24 in 0.08 sec.
2025-11-14 16:43:11,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,459 - INFO - Going to convert document batch...
2025-11-14 16:43:11,461 - INFO - Processing document 8-K_2023-02-13
2025-11-14 16:43:11,482 - INFO - Finished converting document 8-K_2023-02-13 in 0.06 sec.
2025-11-14 16:43:11,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,553 - INFO - Going to convert document batch...
2025-11-14 16:43:11,553 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:43:11,585 - INFO - Finished converting document 8-K_2023-02-15 in 0.08 sec.
2025-11-14 16:43:11,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2023-01-24' --> 'data\processed_data\GE\8-K_2023-01-24.md'
Converted 'data\edgar_documents\GE\8-K_2023-02-13' --> 'data\processed_data\GE\8-K_2023-02-13.md'
Converted 'data\edgar_documents\GE\8-K_2023-02-15' --> 'data\processed_data\GE\8-K_2023-02-15.md'


2025-11-14 16:43:11,643 - INFO - Going to convert document batch...
2025-11-14 16:43:11,644 - INFO - Processing document 8-K_2023-02-27
2025-11-14 16:43:11,694 - INFO - Finished converting document 8-K_2023-02-27 in 0.09 sec.
2025-11-14 16:43:11,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:11,756 - INFO - Going to convert document batch...
2025-11-14 16:43:11,757 - INFO - Processing document 8-K_2023-03-14
2025-11-14 16:43:11,780 - INFO - Finished converting document 8-K_2023-03-14 in 0.06 sec.
2025-11-14 16:43:11,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2023-02-27' --> 'data\processed_data\GE\8-K_2023-02-27.md'
Converted 'data\edgar_documents\GE\8-K_2023-03-14' --> 'data\processed_data\GE\8-K_2023-03-14.md'


2025-11-14 16:43:12,011 - INFO - Going to convert document batch...
2025-11-14 16:43:12,012 - INFO - Processing document 8-K_2023-04-25
2025-11-14 16:43:12,205 - INFO - Finished converting document 8-K_2023-04-25 in 0.41 sec.
2025-11-14 16:43:12,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,323 - INFO - Going to convert document batch...
2025-11-14 16:43:12,324 - INFO - Processing document 8-K_2023-05-08
2025-11-14 16:43:12,386 - INFO - Finished converting document 8-K_2023-05-08 in 0.17 sec.


Converted 'data\edgar_documents\GE\8-K_2023-04-25' --> 'data\processed_data\GE\8-K_2023-04-25.md'
Converted 'data\edgar_documents\GE\8-K_2023-05-08' --> 'data\processed_data\GE\8-K_2023-05-08.md'


2025-11-14 16:43:12,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,491 - INFO - Going to convert document batch...
2025-11-14 16:43:12,494 - INFO - Processing document 8-K_2023-05-17
2025-11-14 16:43:12,518 - INFO - Finished converting document 8-K_2023-05-17 in 0.11 sec.
2025-11-14 16:43:12,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,572 - INFO - Going to convert document batch...
2025-11-14 16:43:12,573 - INFO - Processing document 8-K_2023-05-18
2025-11-14 16:43:12,598 - INFO - Finished converting document 8-K_2023-05-18 in 0.06 sec.
2025-11-14 16:43:12,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,642 - INFO - Going to convert document batch...
2025-11-14 16:43:12,643 - INFO - Processing document 8-K_2023-07-25
2025-11-14 16:43:12,668 - INFO - Finished converting document 8-K_2023-07-25 in 0.06 sec.
2025-11-14 16:43:12,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2023-05-17' --> 'data\processed_data\GE\8-K_2023-05-17.md'
Converted 'data\edgar_documents\GE\8-K_2023-05-18' --> 'data\processed_data\GE\8-K_2023-05-18.md'
Converted 'data\edgar_documents\GE\8-K_2023-07-25' --> 'data\processed_data\GE\8-K_2023-07-25.md'


2025-11-14 16:43:12,733 - INFO - Going to convert document batch...
2025-11-14 16:43:12,733 - INFO - Processing document 8-K_2023-10-24
2025-11-14 16:43:12,789 - INFO - Finished converting document 8-K_2023-10-24 in 0.09 sec.
2025-11-14 16:43:12,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,887 - INFO - Going to convert document batch...
2025-11-14 16:43:12,888 - INFO - Processing document 8-K_2023-11-14
2025-11-14 16:43:12,916 - INFO - Finished converting document 8-K_2023-11-14 in 0.11 sec.
2025-11-14 16:43:12,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:12,980 - INFO - Going to convert document batch...
2025-11-14 16:43:12,980 - INFO - Processing document 8-K_2024-01-16


Converted 'data\edgar_documents\GE\8-K_2023-10-24' --> 'data\processed_data\GE\8-K_2023-10-24.md'
Converted 'data\edgar_documents\GE\8-K_2023-11-14' --> 'data\processed_data\GE\8-K_2023-11-14.md'


2025-11-14 16:43:13,004 - INFO - Finished converting document 8-K_2024-01-16 in 0.06 sec.
2025-11-14 16:43:13,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,060 - INFO - Going to convert document batch...
2025-11-14 16:43:13,061 - INFO - Processing document 8-K_2024-01-23
2025-11-14 16:43:13,089 - INFO - Finished converting document 8-K_2024-01-23 in 0.08 sec.
2025-11-14 16:43:13,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,130 - INFO - Going to convert document batch...
2025-11-14 16:43:13,130 - INFO - Processing document 8-K_2024-02-29
2025-11-14 16:43:13,152 - INFO - Finished converting document 8-K_2024-02-29 in 0.05 sec.
2025-11-14 16:43:13,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,197 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GE\8-K_2024-01-16' --> 'data\processed_data\GE\8-K_2024-01-16.md'
Converted 'data\edgar_documents\GE\8-K_2024-01-23' --> 'data\processed_data\GE\8-K_2024-01-23.md'
Converted 'data\edgar_documents\GE\8-K_2024-02-29' --> 'data\processed_data\GE\8-K_2024-02-29.md'


2025-11-14 16:43:13,198 - INFO - Processing document 8-K_2024-03-07
2025-11-14 16:43:13,232 - INFO - Finished converting document 8-K_2024-03-07 in 0.06 sec.
2025-11-14 16:43:13,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,291 - INFO - Going to convert document batch...
2025-11-14 16:43:13,293 - INFO - Processing document 8-K_2024-04-02
2025-11-14 16:43:13,329 - INFO - Finished converting document 8-K_2024-04-02 in 0.08 sec.
2025-11-14 16:43:13,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,372 - INFO - Going to convert document batch...
2025-11-14 16:43:13,373 - INFO - Processing document 8-K_2024-04-08
2025-11-14 16:43:13,402 - INFO - Finished converting document 8-K_2024-04-08 in 0.06 sec.
2025-11-14 16:43:13,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2024-03-07' --> 'data\processed_data\GE\8-K_2024-03-07.md'
Converted 'data\edgar_documents\GE\8-K_2024-04-02' --> 'data\processed_data\GE\8-K_2024-04-02.md'
Converted 'data\edgar_documents\GE\8-K_2024-04-08' --> 'data\processed_data\GE\8-K_2024-04-08.md'


2025-11-14 16:43:13,453 - INFO - Going to convert document batch...
2025-11-14 16:43:13,454 - INFO - Processing document 8-K_2024-04-11
2025-11-14 16:43:13,504 - INFO - Finished converting document 8-K_2024-04-11 in 0.08 sec.
2025-11-14 16:43:13,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,551 - INFO - Going to convert document batch...
2025-11-14 16:43:13,552 - INFO - Processing document 8-K_2024-04-23
2025-11-14 16:43:13,576 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 16:43:13,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,626 - INFO - Going to convert document batch...
2025-11-14 16:43:13,627 - INFO - Processing document 8-K_2024-05-10
2025-11-14 16:43:13,658 - INFO - Finished converting document 8-K_2024-05-10 in 0.06 sec.
2025-11-14 16:43:13,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,704 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GE\8-K_2024-04-11' --> 'data\processed_data\GE\8-K_2024-04-11.md'
Converted 'data\edgar_documents\GE\8-K_2024-04-23' --> 'data\processed_data\GE\8-K_2024-04-23.md'
Converted 'data\edgar_documents\GE\8-K_2024-05-10' --> 'data\processed_data\GE\8-K_2024-05-10.md'


2025-11-14 16:43:13,705 - INFO - Processing document 8-K_2024-06-21
2025-11-14 16:43:13,740 - INFO - Finished converting document 8-K_2024-06-21 in 0.06 sec.
2025-11-14 16:43:13,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:13,805 - INFO - Going to convert document batch...
2025-11-14 16:43:13,805 - INFO - Processing document 8-K_2024-07-01
2025-11-14 16:43:13,931 - INFO - Finished converting document 8-K_2024-07-01 in 0.16 sec.


Converted 'data\edgar_documents\GE\8-K_2024-06-21' --> 'data\processed_data\GE\8-K_2024-06-21.md'
Converted 'data\edgar_documents\GE\8-K_2024-07-01' --> 'data\processed_data\GE\8-K_2024-07-01.md'


2025-11-14 16:43:14,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:14,032 - INFO - Going to convert document batch...
2025-11-14 16:43:14,033 - INFO - Processing document 8-K_2024-07-23
2025-11-14 16:43:14,067 - INFO - Finished converting document 8-K_2024-07-23 in 0.11 sec.
2025-11-14 16:43:14,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2024-07-23' --> 'data\processed_data\GE\8-K_2024-07-23.md'


2025-11-14 16:43:14,420 - INFO - Going to convert document batch...
2025-11-14 16:43:14,421 - INFO - Processing document 8-K_2024-10-22
2025-11-14 16:43:14,441 - INFO - Finished converting document 8-K_2024-10-22 in 0.36 sec.
2025-11-14 16:43:14,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:14,555 - INFO - Going to convert document batch...
2025-11-14 16:43:14,556 - INFO - Processing document 8-K_2025-01-23
2025-11-14 16:43:14,597 - INFO - Finished converting document 8-K_2025-01-23 in 0.12 sec.
2025-11-14 16:43:14,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\8-K_2024-10-22' --> 'data\processed_data\GE\8-K_2024-10-22.md'
Converted 'data\edgar_documents\GE\8-K_2025-01-23' --> 'data\processed_data\GE\8-K_2025-01-23.md'


2025-11-14 16:43:14,687 - INFO - Going to convert document batch...
2025-11-14 16:43:14,688 - INFO - Processing document 8-K_2025-04-22
2025-11-14 16:43:14,716 - INFO - Finished converting document 8-K_2025-04-22 in 0.11 sec.
2025-11-14 16:43:14,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:14,767 - INFO - Going to convert document batch...
2025-11-14 16:43:14,768 - INFO - Processing document 8-K_2025-05-09
2025-11-14 16:43:14,800 - INFO - Finished converting document 8-K_2025-05-09 in 0.06 sec.
2025-11-14 16:43:14,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:14,851 - INFO - Going to convert document batch...
2025-11-14 16:43:14,851 - INFO - Processing document 8-K_2025-07-17
2025-11-14 16:43:14,886 - INFO - Finished converting document 8-K_2025-07-17 in 0.08 sec.
2025-11-14 16:43:14,914 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:43:14,917 - ERROR - In

Converted 'data\edgar_documents\GE\8-K_2025-04-22' --> 'data\processed_data\GE\8-K_2025-04-22.md'
Converted 'data\edgar_documents\GE\8-K_2025-05-09' --> 'data\processed_data\GE\8-K_2025-05-09.md'
Converted 'data\edgar_documents\GE\8-K_2025-07-17' --> 'data\processed_data\GE\8-K_2025-07-17.md'


2025-11-14 16:43:14,918 - INFO - Going to convert document batch...
2025-11-14 16:43:14,932 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:43:14,933 - ERROR - Input document 8-K_2025-07-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:43:14,935 - INFO - Going to convert document batch...
2025-11-14 16:43:14,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:43:14,970 - INFO - Going to convert document batch

Error processing data\edgar_documents\GE\8-K_2025-07-24: File format not allowed: data\edgar_documents\GE\8-K_2025-07-24
Error processing data\edgar_documents\GE\8-K_2025-07-29: File format not allowed: data\edgar_documents\GE\8-K_2025-07-29
Converted 'data\edgar_documents\GE\8-K_2025-10-01' --> 'data\processed_data\GE\8-K_2025-10-01.md'
Converted 'data\edgar_documents\GE\8-K_2025-10-21' --> 'data\processed_data\GE\8-K_2025-10-21.md'


2025-11-14 16:43:15,276 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:43:15,276 - ERROR - Input document DEF-14A_2023-03-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:43:15,279 - INFO - Going to convert document batch...
2025-11-14 16:43:15,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\GE\DEF-14A_2023-03-16: File format not allowed: data\edgar_documents\GE\DEF-14A_2023-03-16


2025-11-14 16:43:15,843 - INFO - Going to convert document batch...
2025-11-14 16:43:15,844 - INFO - Processing document DEF-14A_2024-03-14
2025-11-14 16:43:17,899 - INFO - Finished converting document DEF-14A_2024-03-14 in 2.61 sec.
2025-11-14 16:43:19,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\DEF-14A_2024-03-14' --> 'data\processed_data\GE\DEF-14A_2024-03-14.md'


2025-11-14 16:43:20,176 - INFO - Going to convert document batch...
2025-11-14 16:43:20,176 - INFO - Processing document DEF-14A_2025-03-13
2025-11-14 16:43:30,334 - INFO - Finished converting document DEF-14A_2025-03-13 in 11.38 sec.
2025-11-14 16:43:31,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GE\DEF-14A_2025-03-13' --> 'data\processed_data\GE\DEF-14A_2025-03-13.md'
Processed 101 new files. Errors: 5
Found 143 files to process in data\edgar_documents\GILD


2025-11-14 16:43:33,017 - INFO - Going to convert document batch...
2025-11-14 16:43:33,018 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:43:33,018 - INFO - Processing document 10-K_2023-02-22
2025-11-14 16:43:34,869 - INFO - Finished converting document 10-K_2023-02-22 in 3.48 sec.
2025-11-14 16:43:35,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-K_2023-02-22' --> 'data\processed_data\GILD\10-K_2023-02-22.md'


2025-11-14 16:43:36,731 - INFO - Going to convert document batch...
2025-11-14 16:43:36,732 - INFO - Processing document 10-K_2024-02-23
2025-11-14 16:43:38,713 - INFO - Finished converting document 10-K_2024-02-23 in 3.14 sec.
2025-11-14 16:43:39,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-K_2024-02-23' --> 'data\processed_data\GILD\10-K_2024-02-23.md'


2025-11-14 16:43:41,141 - INFO - Going to convert document batch...
2025-11-14 16:43:41,142 - INFO - Processing document 10-K_2025-02-28
2025-11-14 16:43:42,951 - INFO - Finished converting document 10-K_2025-02-28 in 3.41 sec.
2025-11-14 16:43:43,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-K_2025-02-28' --> 'data\processed_data\GILD\10-K_2025-02-28.md'


2025-11-14 16:43:44,334 - INFO - Going to convert document batch...
2025-11-14 16:43:44,335 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 16:43:45,757 - INFO - Finished converting document 10-Q_2023-05-03 in 2.02 sec.
2025-11-14 16:43:46,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2023-05-03' --> 'data\processed_data\GILD\10-Q_2023-05-03.md'


2025-11-14 16:43:46,937 - INFO - Going to convert document batch...
2025-11-14 16:43:46,938 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 16:43:48,075 - INFO - Finished converting document 10-Q_2023-08-04 in 1.88 sec.
2025-11-14 16:43:48,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2023-08-04' --> 'data\processed_data\GILD\10-Q_2023-08-04.md'


2025-11-14 16:43:50,299 - INFO - Going to convert document batch...
2025-11-14 16:43:50,301 - INFO - Processing document 10-Q_2023-11-07
2025-11-14 16:43:51,459 - INFO - Finished converting document 10-Q_2023-11-07 in 2.70 sec.
2025-11-14 16:43:52,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2023-11-07' --> 'data\processed_data\GILD\10-Q_2023-11-07.md'


2025-11-14 16:43:53,138 - INFO - Going to convert document batch...
2025-11-14 16:43:53,139 - INFO - Processing document 10-Q_2024-05-08
2025-11-14 16:43:54,390 - INFO - Finished converting document 10-Q_2024-05-08 in 2.20 sec.
2025-11-14 16:43:55,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2024-05-08' --> 'data\processed_data\GILD\10-Q_2024-05-08.md'


2025-11-14 16:43:55,772 - INFO - Going to convert document batch...
2025-11-14 16:43:55,773 - INFO - Processing document 10-Q_2024-08-08
2025-11-14 16:43:56,945 - INFO - Finished converting document 10-Q_2024-08-08 in 1.89 sec.
2025-11-14 16:43:57,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2024-08-08' --> 'data\processed_data\GILD\10-Q_2024-08-08.md'


2025-11-14 16:43:58,869 - INFO - Going to convert document batch...
2025-11-14 16:43:58,870 - INFO - Processing document 10-Q_2024-11-12
2025-11-14 16:44:00,337 - INFO - Finished converting document 10-Q_2024-11-12 in 2.69 sec.


Converted 'data\edgar_documents\GILD\10-Q_2024-11-12' --> 'data\processed_data\GILD\10-Q_2024-11-12.md'


2025-11-14 16:44:01,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:02,179 - INFO - Going to convert document batch...
2025-11-14 16:44:02,180 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 16:44:02,983 - INFO - Finished converting document 10-Q_2025-05-07 in 2.06 sec.
2025-11-14 16:44:03,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2025-05-07' --> 'data\processed_data\GILD\10-Q_2025-05-07.md'


2025-11-14 16:44:04,152 - INFO - Going to convert document batch...
2025-11-14 16:44:04,153 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:44:06,030 - INFO - Finished converting document 10-Q_2025-08-07 in 2.62 sec.
2025-11-14 16:44:06,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\10-Q_2025-08-07' --> 'data\processed_data\GILD\10-Q_2025-08-07.md'


2025-11-14 16:44:07,388 - INFO - Going to convert document batch...
2025-11-14 16:44:07,391 - INFO - Processing document 10-Q_2025-11-07
2025-11-14 16:44:08,512 - INFO - Finished converting document 10-Q_2025-11-07 in 1.89 sec.
2025-11-14 16:44:09,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:09,869 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\10-Q_2025-11-07' --> 'data\processed_data\GILD\10-Q_2025-11-07.md'


2025-11-14 16:44:09,871 - INFO - Processing document 4_2023-01-03
2025-11-14 16:44:09,901 - INFO - Finished converting document 4_2023-01-03 in 0.22 sec.
2025-11-14 16:44:09,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:09,995 - INFO - Going to convert document batch...
2025-11-14 16:44:09,997 - INFO - Processing document 4_2023-01-26
2025-11-14 16:44:10,039 - INFO - Finished converting document 4_2023-01-26 in 0.08 sec.
2025-11-14 16:44:10,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,089 - INFO - Going to convert document batch...
2025-11-14 16:44:10,091 - INFO - Processing document 4_2023-02-07
2025-11-14 16:44:10,124 - INFO - Finished converting document 4_2023-02-07 in 0.06 sec.


Converted 'data\edgar_documents\GILD\4_2023-01-03' --> 'data\processed_data\GILD\4_2023-01-03.md'
Converted 'data\edgar_documents\GILD\4_2023-01-26' --> 'data\processed_data\GILD\4_2023-01-26.md'


2025-11-14 16:44:10,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,191 - INFO - Going to convert document batch...
2025-11-14 16:44:10,192 - INFO - Processing document 4_2023-02-23
2025-11-14 16:44:10,217 - INFO - Finished converting document 4_2023-02-23 in 0.06 sec.
2025-11-14 16:44:10,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,273 - INFO - Going to convert document batch...
2025-11-14 16:44:10,273 - INFO - Processing document 4_2023-03-02
2025-11-14 16:44:10,294 - INFO - Finished converting document 4_2023-03-02 in 0.06 sec.
2025-11-14 16:44:10,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,336 - INFO - Going to convert document batch...
2025-11-14 16:44:10,337 - INFO - Processing document 4_2023-03-10


Converted 'data\edgar_documents\GILD\4_2023-02-07' --> 'data\processed_data\GILD\4_2023-02-07.md'
Converted 'data\edgar_documents\GILD\4_2023-02-23' --> 'data\processed_data\GILD\4_2023-02-23.md'
Converted 'data\edgar_documents\GILD\4_2023-03-02' --> 'data\processed_data\GILD\4_2023-03-02.md'


2025-11-14 16:44:10,381 - INFO - Finished converting document 4_2023-03-10 in 0.06 sec.
2025-11-14 16:44:10,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,486 - INFO - Going to convert document batch...
2025-11-14 16:44:10,487 - INFO - Processing document 4_2023-03-13
2025-11-14 16:44:10,541 - INFO - Finished converting document 4_2023-03-13 in 0.12 sec.
2025-11-14 16:44:10,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,611 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2023-03-10' --> 'data\processed_data\GILD\4_2023-03-10.md'
Converted 'data\edgar_documents\GILD\4_2023-03-13' --> 'data\processed_data\GILD\4_2023-03-13.md'


2025-11-14 16:44:10,612 - INFO - Processing document 4_2023-03-14
2025-11-14 16:44:10,642 - INFO - Finished converting document 4_2023-03-14 in 0.06 sec.
2025-11-14 16:44:10,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,700 - INFO - Going to convert document batch...
2025-11-14 16:44:10,701 - INFO - Processing document 4_2023-03-31
2025-11-14 16:44:10,781 - INFO - Finished converting document 4_2023-03-31 in 0.11 sec.


Converted 'data\edgar_documents\GILD\4_2023-03-14' --> 'data\processed_data\GILD\4_2023-03-14.md'
Converted 'data\edgar_documents\GILD\4_2023-03-31' --> 'data\processed_data\GILD\4_2023-03-31.md'


2025-11-14 16:44:10,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,886 - INFO - Going to convert document batch...
2025-11-14 16:44:10,887 - INFO - Processing document 4_2023-05-02
2025-11-14 16:44:10,915 - INFO - Finished converting document 4_2023-05-02 in 0.09 sec.
2025-11-14 16:44:10,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:10,967 - INFO - Going to convert document batch...
2025-11-14 16:44:10,967 - INFO - Processing document 4_2023-05-04
2025-11-14 16:44:11,004 - INFO - Finished converting document 4_2023-05-04 in 0.06 sec.
2025-11-14 16:44:11,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,062 - INFO - Going to convert document batch...
2025-11-14 16:44:11,063 - INFO - Processing document 4_2023-06-12
2025-11-14 16:44:11,088 - INFO - Finished converting document 4_2023-06-12 in 0.06 sec.


Converted 'data\edgar_documents\GILD\4_2023-05-02' --> 'data\processed_data\GILD\4_2023-05-02.md'
Converted 'data\edgar_documents\GILD\4_2023-05-04' --> 'data\processed_data\GILD\4_2023-05-04.md'
Converted 'data\edgar_documents\GILD\4_2023-06-12' --> 'data\processed_data\GILD\4_2023-06-12.md'


2025-11-14 16:44:11,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,158 - INFO - Going to convert document batch...
2025-11-14 16:44:11,159 - INFO - Processing document 4_2023-06-14
2025-11-14 16:44:11,194 - INFO - Finished converting document 4_2023-06-14 in 0.08 sec.
2025-11-14 16:44:11,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,280 - INFO - Going to convert document batch...
2025-11-14 16:44:11,280 - INFO - Processing document 4_2023-06-28
2025-11-14 16:44:11,303 - INFO - Finished converting document 4_2023-06-28 in 0.06 sec.
2025-11-14 16:44:11,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,358 - INFO - Going to convert document batch...
2025-11-14 16:44:11,358 - INFO - Processing document 4_2023-06-30
2025-11-14 16:44:11,382 - INFO - Finished converting document 4_2023-06-30 in 0.05 sec.
2025-11-14 16:44:11,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2023-06-14' --> 'data\processed_data\GILD\4_2023-06-14.md'
Converted 'data\edgar_documents\GILD\4_2023-06-28' --> 'data\processed_data\GILD\4_2023-06-28.md'
Converted 'data\edgar_documents\GILD\4_2023-06-30' --> 'data\processed_data\GILD\4_2023-06-30.md'


2025-11-14 16:44:11,433 - INFO - Going to convert document batch...
2025-11-14 16:44:11,434 - INFO - Processing document 4_2023-07-21
2025-11-14 16:44:11,464 - INFO - Finished converting document 4_2023-07-21 in 0.06 sec.
2025-11-14 16:44:11,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,519 - INFO - Going to convert document batch...
2025-11-14 16:44:11,519 - INFO - Processing document 4_2023-07-25
2025-11-14 16:44:11,542 - INFO - Finished converting document 4_2023-07-25 in 0.05 sec.
2025-11-14 16:44:11,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,606 - INFO - Going to convert document batch...
2025-11-14 16:44:11,608 - INFO - Processing document 4_2023-07-26
2025-11-14 16:44:11,637 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 16:44:11,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,691 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2023-07-21' --> 'data\processed_data\GILD\4_2023-07-21.md'
Converted 'data\edgar_documents\GILD\4_2023-07-25' --> 'data\processed_data\GILD\4_2023-07-25.md'
Converted 'data\edgar_documents\GILD\4_2023-07-26' --> 'data\processed_data\GILD\4_2023-07-26.md'


2025-11-14 16:44:11,692 - INFO - Processing document 4_2023-08-11
2025-11-14 16:44:11,713 - INFO - Finished converting document 4_2023-08-11 in 0.05 sec.
2025-11-14 16:44:11,768 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:44:11,769 - ERROR - Input document 4_2023-09-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:44:11,770 - INFO - Going to convert document batch...
2025-11-14 16:44:11,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44

Converted 'data\edgar_documents\GILD\4_2023-08-11' --> 'data\processed_data\GILD\4_2023-08-11.md'
Error processing data\edgar_documents\GILD\4_2023-09-07: File format not allowed: data\edgar_documents\GILD\4_2023-09-07
Converted 'data\edgar_documents\GILD\4_2023-09-11' --> 'data\processed_data\GILD\4_2023-09-11.md'
Converted 'data\edgar_documents\GILD\4_2023-09-13' --> 'data\processed_data\GILD\4_2023-09-13.md'


2025-11-14 16:44:11,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:11,966 - INFO - Going to convert document batch...
2025-11-14 16:44:11,967 - INFO - Processing document 4_2023-09-29
2025-11-14 16:44:12,090 - INFO - Finished converting document 4_2023-09-29 in 0.17 sec.
2025-11-14 16:44:12,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,152 - INFO - Going to convert document batch...
2025-11-14 16:44:12,153 - INFO - Processing document 4_2023-10-18
2025-11-14 16:44:12,176 - INFO - Finished converting document 4_2023-10-18 in 0.05 sec.
2025-11-14 16:44:12,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,222 - INFO - Going to convert document batch...
2025-11-14 16:44:12,223 - INFO - Processing document 4_2023-10-26
2025-11-14 16:44:12,243 - INFO - Finished converting document 4_2023-10-26 in 0.05 sec.
2025-11-14 16:44:12,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GILD\4_2023-09-29' --> 'data\processed_data\GILD\4_2023-09-29.md'
Converted 'data\edgar_documents\GILD\4_2023-10-18' --> 'data\processed_data\GILD\4_2023-10-18.md'
Converted 'data\edgar_documents\GILD\4_2023-10-26' --> 'data\processed_data\GILD\4_2023-10-26.md'


2025-11-14 16:44:12,327 - INFO - Finished converting document 4_2023-11-13 in 0.06 sec.
2025-11-14 16:44:12,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,376 - INFO - Going to convert document batch...
2025-11-14 16:44:12,376 - INFO - Processing document 4_2023-12-11
2025-11-14 16:44:12,406 - INFO - Finished converting document 4_2023-12-11 in 0.06 sec.
2025-11-14 16:44:12,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,469 - INFO - Going to convert document batch...
2025-11-14 16:44:12,470 - INFO - Processing document 4_2023-12-29
2025-11-14 16:44:12,495 - INFO - Finished converting document 4_2023-12-29 in 0.06 sec.
2025-11-14 16:44:12,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2023-11-13' --> 'data\processed_data\GILD\4_2023-11-13.md'
Converted 'data\edgar_documents\GILD\4_2023-12-11' --> 'data\processed_data\GILD\4_2023-12-11.md'
Converted 'data\edgar_documents\GILD\4_2023-12-29' --> 'data\processed_data\GILD\4_2023-12-29.md'


2025-11-14 16:44:12,541 - INFO - Going to convert document batch...
2025-11-14 16:44:12,542 - INFO - Processing document 4_2024-01-10
2025-11-14 16:44:12,560 - INFO - Finished converting document 4_2024-01-10 in 0.05 sec.
2025-11-14 16:44:12,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,734 - INFO - Going to convert document batch...
2025-11-14 16:44:12,734 - INFO - Processing document 4_2024-01-17
2025-11-14 16:44:12,766 - INFO - Finished converting document 4_2024-01-17 in 0.09 sec.
2025-11-14 16:44:12,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,829 - INFO - Going to convert document batch...
2025-11-14 16:44:12,830 - INFO - Processing document 4_2024-01-26
2025-11-14 16:44:12,856 - INFO - Finished converting document 4_2024-01-26 in 0.06 sec.


Converted 'data\edgar_documents\GILD\4_2024-01-10' --> 'data\processed_data\GILD\4_2024-01-10.md'
Converted 'data\edgar_documents\GILD\4_2024-01-17' --> 'data\processed_data\GILD\4_2024-01-17.md'


2025-11-14 16:44:12,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,905 - INFO - Going to convert document batch...
2025-11-14 16:44:12,906 - INFO - Processing document 4_2024-01-31
2025-11-14 16:44:12,931 - INFO - Finished converting document 4_2024-01-31 in 0.05 sec.
2025-11-14 16:44:12,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:12,981 - INFO - Going to convert document batch...
2025-11-14 16:44:12,982 - INFO - Processing document 4_2024-02-02
2025-11-14 16:44:13,007 - INFO - Finished converting document 4_2024-02-02 in 0.05 sec.
2025-11-14 16:44:13,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,051 - INFO - Going to convert document batch...
2025-11-14 16:44:13,052 - INFO - Processing document 4_2024-02-06


Converted 'data\edgar_documents\GILD\4_2024-01-26' --> 'data\processed_data\GILD\4_2024-01-26.md'
Converted 'data\edgar_documents\GILD\4_2024-01-31' --> 'data\processed_data\GILD\4_2024-01-31.md'
Converted 'data\edgar_documents\GILD\4_2024-02-02' --> 'data\processed_data\GILD\4_2024-02-02.md'


2025-11-14 16:44:13,075 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 16:44:13,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,129 - INFO - Going to convert document batch...
2025-11-14 16:44:13,130 - INFO - Processing document 4_2024-02-13
2025-11-14 16:44:13,224 - INFO - Finished converting document 4_2024-02-13 in 0.11 sec.
2025-11-14 16:44:13,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,291 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2024-02-06' --> 'data\processed_data\GILD\4_2024-02-06.md'
Converted 'data\edgar_documents\GILD\4_2024-02-13' --> 'data\processed_data\GILD\4_2024-02-13.md'


2025-11-14 16:44:13,292 - INFO - Processing document 4_2024-02-29
2025-11-14 16:44:13,318 - INFO - Finished converting document 4_2024-02-29 in 0.05 sec.
2025-11-14 16:44:13,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,373 - INFO - Going to convert document batch...
2025-11-14 16:44:13,379 - INFO - Processing document 4_2024-03-11
2025-11-14 16:44:13,416 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.
2025-11-14 16:44:13,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,470 - INFO - Going to convert document batch...
2025-11-14 16:44:13,470 - INFO - Processing document 4_2024-03-12
2025-11-14 16:44:13,503 - INFO - Finished converting document 4_2024-03-12 in 0.06 sec.
2025-11-14 16:44:13,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2024-02-29' --> 'data\processed_data\GILD\4_2024-02-29.md'
Converted 'data\edgar_documents\GILD\4_2024-03-11' --> 'data\processed_data\GILD\4_2024-03-11.md'
Converted 'data\edgar_documents\GILD\4_2024-03-12' --> 'data\processed_data\GILD\4_2024-03-12.md'


2025-11-14 16:44:13,556 - INFO - Going to convert document batch...
2025-11-14 16:44:13,557 - INFO - Processing document 4_2024-03-29
2025-11-14 16:44:13,586 - INFO - Finished converting document 4_2024-03-29 in 0.05 sec.
2025-11-14 16:44:13,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,647 - INFO - Going to convert document batch...
2025-11-14 16:44:13,648 - INFO - Processing document 4_2024-04-02
2025-11-14 16:44:13,666 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 16:44:13,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,714 - INFO - Going to convert document batch...
2025-11-14 16:44:13,714 - INFO - Processing document 4_2024-04-03
2025-11-14 16:44:13,743 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 16:44:13,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2024-03-29' --> 'data\processed_data\GILD\4_2024-03-29.md'
Converted 'data\edgar_documents\GILD\4_2024-04-02' --> 'data\processed_data\GILD\4_2024-04-02.md'
Converted 'data\edgar_documents\GILD\4_2024-04-03' --> 'data\processed_data\GILD\4_2024-04-03.md'


2025-11-14 16:44:13,805 - INFO - Going to convert document batch...
2025-11-14 16:44:13,805 - INFO - Processing document 4_2024-04-26
2025-11-14 16:44:13,832 - INFO - Finished converting document 4_2024-04-26 in 0.06 sec.
2025-11-14 16:44:13,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,884 - INFO - Going to convert document batch...
2025-11-14 16:44:13,885 - INFO - Processing document 4_2024-05-09
2025-11-14 16:44:13,909 - INFO - Finished converting document 4_2024-05-09 in 0.05 sec.
2025-11-14 16:44:13,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:13,957 - INFO - Going to convert document batch...
2025-11-14 16:44:13,958 - INFO - Processing document 4_2024-06-11
2025-11-14 16:44:13,980 - INFO - Finished converting document 4_2024-06-11 in 0.05 sec.
2025-11-14 16:44:14,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,047 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2024-04-26' --> 'data\processed_data\GILD\4_2024-04-26.md'
Converted 'data\edgar_documents\GILD\4_2024-05-09' --> 'data\processed_data\GILD\4_2024-05-09.md'
Converted 'data\edgar_documents\GILD\4_2024-06-11' --> 'data\processed_data\GILD\4_2024-06-11.md'


2025-11-14 16:44:14,048 - INFO - Processing document 4_2024-06-20
2025-11-14 16:44:14,075 - INFO - Finished converting document 4_2024-06-20 in 0.06 sec.
2025-11-14 16:44:14,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,134 - INFO - Going to convert document batch...
2025-11-14 16:44:14,135 - INFO - Processing document 4_2024-07-01
2025-11-14 16:44:14,153 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 16:44:14,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,197 - INFO - Going to convert document batch...
2025-11-14 16:44:14,198 - INFO - Processing document 4_2024-07-26
2025-11-14 16:44:14,226 - INFO - Finished converting document 4_2024-07-26 in 0.05 sec.
2025-11-14 16:44:14,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,281 - INFO - Going to convert document batch...
2025-11-14 16:44:14,282 - INFO - Processing document 4_2024-08-12
2025-11-14 16:44:14,303 - IN

Converted 'data\edgar_documents\GILD\4_2024-06-20' --> 'data\processed_data\GILD\4_2024-06-20.md'
Converted 'data\edgar_documents\GILD\4_2024-07-01' --> 'data\processed_data\GILD\4_2024-07-01.md'
Converted 'data\edgar_documents\GILD\4_2024-07-26' --> 'data\processed_data\GILD\4_2024-07-26.md'


2025-11-14 16:44:14,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,352 - INFO - Going to convert document batch...
2025-11-14 16:44:14,353 - INFO - Processing document 4_2024-08-14
2025-11-14 16:44:14,379 - INFO - Finished converting document 4_2024-08-14 in 0.05 sec.
2025-11-14 16:44:14,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,448 - INFO - Going to convert document batch...
2025-11-14 16:44:14,449 - INFO - Processing document 4_2024-08-29
2025-11-14 16:44:14,473 - INFO - Finished converting document 4_2024-08-29 in 0.06 sec.
2025-11-14 16:44:14,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,519 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2024-08-12' --> 'data\processed_data\GILD\4_2024-08-12.md'
Converted 'data\edgar_documents\GILD\4_2024-08-14' --> 'data\processed_data\GILD\4_2024-08-14.md'
Converted 'data\edgar_documents\GILD\4_2024-08-29' --> 'data\processed_data\GILD\4_2024-08-29.md'


2025-11-14 16:44:14,519 - INFO - Processing document 4_2024-09-11
2025-11-14 16:44:14,543 - INFO - Finished converting document 4_2024-09-11 in 0.06 sec.
2025-11-14 16:44:14,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,702 - INFO - Going to convert document batch...
2025-11-14 16:44:14,703 - INFO - Processing document 4_2024-09-13
2025-11-14 16:44:14,727 - INFO - Finished converting document 4_2024-09-13 in 0.06 sec.
2025-11-14 16:44:14,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,779 - INFO - Going to convert document batch...
2025-11-14 16:44:14,780 - INFO - Processing document 4_2024-10-02
2025-11-14 16:44:14,808 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 16:44:14,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2024-09-11' --> 'data\processed_data\GILD\4_2024-09-11.md'
Converted 'data\edgar_documents\GILD\4_2024-09-13' --> 'data\processed_data\GILD\4_2024-09-13.md'
Converted 'data\edgar_documents\GILD\4_2024-10-02' --> 'data\processed_data\GILD\4_2024-10-02.md'


2025-11-14 16:44:14,871 - INFO - Going to convert document batch...
2025-11-14 16:44:14,872 - INFO - Processing document 4_2024-10-28
2025-11-14 16:44:14,911 - INFO - Finished converting document 4_2024-10-28 in 0.08 sec.
2025-11-14 16:44:14,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:14,999 - INFO - Going to convert document batch...
2025-11-14 16:44:14,999 - INFO - Processing document 4_2024-11-07
2025-11-14 16:44:15,018 - INFO - Finished converting document 4_2024-11-07 in 0.06 sec.
2025-11-14 16:44:15,066 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:44:15,066 - ERROR - Input document 4_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\GILD\4_2024-10-28' --> 'data\processed_data\GILD\4_2024-10-28.md'
Converted 'data\edgar_documents\GILD\4_2024-11-07' --> 'data\processed_data\GILD\4_2024-11-07.md'
Error processing data\edgar_documents\GILD\4_2024-11-13: File format not allowed: data\edgar_documents\GILD\4_2024-11-13
Error processing data\edgar_documents\GILD\4_2024-11-15: File format not allowed: data\edgar_documents\GILD\4_2024-11-15


2025-11-14 16:44:15,137 - INFO - Processing document 4_2024-11-27
2025-11-14 16:44:15,186 - INFO - Finished converting document 4_2024-11-27 in 0.09 sec.
2025-11-14 16:44:15,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,268 - INFO - Going to convert document batch...
2025-11-14 16:44:15,269 - INFO - Processing document 4_2024-11-29
2025-11-14 16:44:15,300 - INFO - Finished converting document 4_2024-11-29 in 0.08 sec.
2025-11-14 16:44:15,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,376 - INFO - Going to convert document batch...
2025-11-14 16:44:15,378 - INFO - Processing document 4_2024-12-03
2025-11-14 16:44:15,419 - INFO - Finished converting document 4_2024-12-03 in 0.09 sec.


Converted 'data\edgar_documents\GILD\4_2024-11-27' --> 'data\processed_data\GILD\4_2024-11-27.md'
Converted 'data\edgar_documents\GILD\4_2024-11-29' --> 'data\processed_data\GILD\4_2024-11-29.md'


2025-11-14 16:44:15,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,481 - INFO - Going to convert document batch...
2025-11-14 16:44:15,482 - INFO - Processing document 4_2024-12-11
2025-11-14 16:44:15,511 - INFO - Finished converting document 4_2024-12-11 in 0.06 sec.
2025-11-14 16:44:15,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,562 - INFO - Going to convert document batch...
2025-11-14 16:44:15,563 - INFO - Processing document 4_2024-12-16
2025-11-14 16:44:15,599 - INFO - Finished converting document 4_2024-12-16 in 0.06 sec.


Converted 'data\edgar_documents\GILD\4_2024-12-03' --> 'data\processed_data\GILD\4_2024-12-03.md'
Converted 'data\edgar_documents\GILD\4_2024-12-11' --> 'data\processed_data\GILD\4_2024-12-11.md'


2025-11-14 16:44:15,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,764 - INFO - Going to convert document batch...
2025-11-14 16:44:15,765 - INFO - Processing document 4_2024-12-17
2025-11-14 16:44:15,783 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 16:44:15,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,840 - INFO - Going to convert document batch...
2025-11-14 16:44:15,841 - INFO - Processing document 4_2024-12-19
2025-11-14 16:44:15,862 - INFO - Finished converting document 4_2024-12-19 in 0.05 sec.
2025-11-14 16:44:15,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,903 - INFO - Going to convert document batch...
2025-11-14 16:44:15,905 - INFO - Processing document 4_2024-12-23
2025-11-14 16:44:15,930 - INFO - Finished converting document 4_2024-12-23 in 0.05 sec.


Converted 'data\edgar_documents\GILD\4_2024-12-16' --> 'data\processed_data\GILD\4_2024-12-16.md'
Converted 'data\edgar_documents\GILD\4_2024-12-17' --> 'data\processed_data\GILD\4_2024-12-17.md'
Converted 'data\edgar_documents\GILD\4_2024-12-19' --> 'data\processed_data\GILD\4_2024-12-19.md'


2025-11-14 16:44:15,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:15,982 - INFO - Going to convert document batch...
2025-11-14 16:44:15,983 - INFO - Processing document 4_2025-01-03
2025-11-14 16:44:16,008 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 16:44:16,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2024-12-23' --> 'data\processed_data\GILD\4_2024-12-23.md'
Converted 'data\edgar_documents\GILD\4_2025-01-03' --> 'data\processed_data\GILD\4_2025-01-03.md'


2025-11-14 16:44:16,153 - INFO - Going to convert document batch...
2025-11-14 16:44:16,154 - INFO - Processing document 4_2025-01-16
2025-11-14 16:44:16,180 - INFO - Finished converting document 4_2025-01-16 in 0.06 sec.
2025-11-14 16:44:16,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:16,228 - INFO - Going to convert document batch...
2025-11-14 16:44:16,228 - INFO - Processing document 4_2025-01-27
2025-11-14 16:44:16,250 - INFO - Finished converting document 4_2025-01-27 in 0.05 sec.
2025-11-14 16:44:16,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:16,304 - INFO - Going to convert document batch...
2025-11-14 16:44:16,305 - INFO - Processing document 4_2025-02-03
2025-11-14 16:44:16,335 - INFO - Finished converting document 4_2025-02-03 in 0.06 sec.
2025-11-14 16:44:16,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:16,385 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\4_2025-01-16' --> 'data\processed_data\GILD\4_2025-01-16.md'
Converted 'data\edgar_documents\GILD\4_2025-01-27' --> 'data\processed_data\GILD\4_2025-01-27.md'
Converted 'data\edgar_documents\GILD\4_2025-02-03' --> 'data\processed_data\GILD\4_2025-02-03.md'


2025-11-14 16:44:16,386 - INFO - Processing document 4_2025-02-06
2025-11-14 16:44:16,952 - INFO - Finished converting document 4_2025-02-06 in 0.59 sec.
2025-11-14 16:44:17,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,049 - INFO - Going to convert document batch...
2025-11-14 16:44:17,050 - INFO - Processing document 4_2025-02-13
2025-11-14 16:44:17,092 - INFO - Finished converting document 4_2025-02-13 in 0.12 sec.


Converted 'data\edgar_documents\GILD\4_2025-02-06' --> 'data\processed_data\GILD\4_2025-02-06.md'
Converted 'data\edgar_documents\GILD\4_2025-02-13' --> 'data\processed_data\GILD\4_2025-02-13.md'


2025-11-14 16:44:17,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,190 - INFO - Going to convert document batch...
2025-11-14 16:44:17,191 - INFO - Processing document 4_2025-02-19
2025-11-14 16:44:17,225 - INFO - Finished converting document 4_2025-02-19 in 0.09 sec.
2025-11-14 16:44:17,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,274 - INFO - Going to convert document batch...
2025-11-14 16:44:17,275 - INFO - Processing document 4_2025-02-20
2025-11-14 16:44:17,295 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 16:44:17,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,340 - INFO - Going to convert document batch...
2025-11-14 16:44:17,342 - INFO - Processing document 4_2025-03-12
2025-11-14 16:44:17,371 - INFO - Finished converting document 4_2025-03-12 in 0.06 sec.
2025-11-14 16:44:17,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GILD\4_2025-02-19' --> 'data\processed_data\GILD\4_2025-02-19.md'
Converted 'data\edgar_documents\GILD\4_2025-02-20' --> 'data\processed_data\GILD\4_2025-02-20.md'
Converted 'data\edgar_documents\GILD\4_2025-03-12' --> 'data\processed_data\GILD\4_2025-03-12.md'


2025-11-14 16:44:17,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,558 - INFO - Going to convert document batch...
2025-11-14 16:44:17,561 - INFO - Processing document 4_2025-04-16
2025-11-14 16:44:17,607 - INFO - Finished converting document 4_2025-04-16 in 0.16 sec.


Converted 'data\edgar_documents\GILD\4_2025-03-18' --> 'data\processed_data\GILD\4_2025-03-18.md'


2025-11-14 16:44:17,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,696 - INFO - Going to convert document batch...
2025-11-14 16:44:17,697 - INFO - Processing document 4_2025-04-28
2025-11-14 16:44:17,720 - INFO - Finished converting document 4_2025-04-28 in 0.08 sec.


Converted 'data\edgar_documents\GILD\4_2025-04-16' --> 'data\processed_data\GILD\4_2025-04-16.md'
Converted 'data\edgar_documents\GILD\4_2025-04-28' --> 'data\processed_data\GILD\4_2025-04-28.md'


2025-11-14 16:44:17,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,866 - INFO - Going to convert document batch...
2025-11-14 16:44:17,867 - INFO - Processing document 4_2025-05-08
2025-11-14 16:44:17,895 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.
2025-11-14 16:44:17,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:17,940 - INFO - Going to convert document batch...
2025-11-14 16:44:17,941 - INFO - Processing document 4_2025-05-16
2025-11-14 16:44:17,963 - INFO - Finished converting document 4_2025-05-16 in 0.03 sec.
2025-11-14 16:44:17,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,010 - INFO - Going to convert document batch...
2025-11-14 16:44:18,011 - INFO - Processing document 4_2025-05-23
2025-11-14 16:44:18,043 - INFO - Finished converting document 4_2025-05-23 in 0.06 sec.
2025-11-14 16:44:18,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GILD\4_2025-05-08' --> 'data\processed_data\GILD\4_2025-05-08.md'
Converted 'data\edgar_documents\GILD\4_2025-05-16' --> 'data\processed_data\GILD\4_2025-05-16.md'
Converted 'data\edgar_documents\GILD\4_2025-05-23' --> 'data\processed_data\GILD\4_2025-05-23.md'


2025-11-14 16:44:18,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,194 - INFO - Going to convert document batch...
2025-11-14 16:44:18,195 - INFO - Processing document 4_2025-06-06
2025-11-14 16:44:18,229 - INFO - Finished converting document 4_2025-06-06 in 0.08 sec.
2025-11-14 16:44:18,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,280 - INFO - Going to convert document batch...
2025-11-14 16:44:18,281 - INFO - Processing document 4_2025-06-11
2025-11-14 16:44:18,305 - INFO - Finished converting document 4_2025-06-11 in 0.05 sec.
2025-11-14 16:44:18,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2025-06-02' --> 'data\processed_data\GILD\4_2025-06-02.md'
Converted 'data\edgar_documents\GILD\4_2025-06-06' --> 'data\processed_data\GILD\4_2025-06-06.md'
Converted 'data\edgar_documents\GILD\4_2025-06-11' --> 'data\processed_data\GILD\4_2025-06-11.md'


2025-11-14 16:44:18,350 - INFO - Going to convert document batch...
2025-11-14 16:44:18,352 - INFO - Processing document 4_2025-06-17
2025-11-14 16:44:18,374 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 16:44:18,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,420 - INFO - Going to convert document batch...
2025-11-14 16:44:18,421 - INFO - Processing document 4_2025-07-01
2025-11-14 16:44:18,443 - INFO - Finished converting document 4_2025-07-01 in 0.05 sec.
2025-11-14 16:44:18,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,491 - INFO - Going to convert document batch...
2025-11-14 16:44:18,492 - INFO - Processing document 4_2025-07-15
2025-11-14 16:44:18,515 - INFO - Finished converting document 4_2025-07-15 in 0.05 sec.
2025-11-14 16:44:18,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,562 - INFO - Going to convert document batch...
2025-11-14 16:44:18,562 - 

Converted 'data\edgar_documents\GILD\4_2025-06-17' --> 'data\processed_data\GILD\4_2025-06-17.md'
Converted 'data\edgar_documents\GILD\4_2025-07-01' --> 'data\processed_data\GILD\4_2025-07-01.md'
Converted 'data\edgar_documents\GILD\4_2025-07-15' --> 'data\processed_data\GILD\4_2025-07-15.md'


2025-11-14 16:44:18,590 - INFO - Finished converting document 4_2025-07-16 in 0.05 sec.
2025-11-14 16:44:18,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,657 - INFO - Going to convert document batch...
2025-11-14 16:44:18,659 - INFO - Processing document 4_2025-07-28
2025-11-14 16:44:18,684 - INFO - Finished converting document 4_2025-07-28 in 0.06 sec.
2025-11-14 16:44:18,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:18,749 - INFO - Going to convert document batch...
2025-11-14 16:44:18,750 - INFO - Processing document 4_2025-07-29
2025-11-14 16:44:18,782 - INFO - Finished converting document 4_2025-07-29 in 0.08 sec.
2025-11-14 16:44:18,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2025-07-16' --> 'data\processed_data\GILD\4_2025-07-16.md'
Converted 'data\edgar_documents\GILD\4_2025-07-28' --> 'data\processed_data\GILD\4_2025-07-28.md'
Converted 'data\edgar_documents\GILD\4_2025-07-29' --> 'data\processed_data\GILD\4_2025-07-29.md'


2025-11-14 16:44:18,842 - INFO - Going to convert document batch...
2025-11-14 16:44:18,844 - INFO - Processing document 4_2025-08-18
2025-11-14 16:44:18,896 - INFO - Finished converting document 4_2025-08-18 in 0.09 sec.
2025-11-14 16:44:18,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,005 - INFO - Going to convert document batch...
2025-11-14 16:44:19,006 - INFO - Processing document 4_2025-08-29
2025-11-14 16:44:19,030 - INFO - Finished converting document 4_2025-08-29 in 0.09 sec.
2025-11-14 16:44:19,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,076 - INFO - Going to convert document batch...
2025-11-14 16:44:19,077 - INFO - Processing document 4_2025-09-11
2025-11-14 16:44:19,100 - INFO - Finished converting document 4_2025-09-11 in 0.05 sec.


Converted 'data\edgar_documents\GILD\4_2025-08-18' --> 'data\processed_data\GILD\4_2025-08-18.md'
Converted 'data\edgar_documents\GILD\4_2025-08-29' --> 'data\processed_data\GILD\4_2025-08-29.md'
Converted 'data\edgar_documents\GILD\4_2025-09-11' --> 'data\processed_data\GILD\4_2025-09-11.md'


2025-11-14 16:44:19,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,172 - INFO - Going to convert document batch...
2025-11-14 16:44:19,173 - INFO - Processing document 4_2025-09-16
2025-11-14 16:44:19,200 - INFO - Finished converting document 4_2025-09-16 in 0.08 sec.
2025-11-14 16:44:19,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,246 - INFO - Going to convert document batch...
2025-11-14 16:44:19,247 - INFO - Processing document 4_2025-09-23
2025-11-14 16:44:19,268 - INFO - Finished converting document 4_2025-09-23 in 0.05 sec.
2025-11-14 16:44:19,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,330 - INFO - Going to convert document batch...
2025-11-14 16:44:19,332 - INFO - Processing document 4_2025-09-30
2025-11-14 16:44:19,356 - INFO - Finished converting document 4_2025-09-30 in 0.06 sec.
2025-11-14 16:44:19,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\4_2025-09-16' --> 'data\processed_data\GILD\4_2025-09-16.md'
Converted 'data\edgar_documents\GILD\4_2025-09-23' --> 'data\processed_data\GILD\4_2025-09-23.md'
Converted 'data\edgar_documents\GILD\4_2025-09-30' --> 'data\processed_data\GILD\4_2025-09-30.md'


2025-11-14 16:44:19,413 - INFO - Going to convert document batch...
2025-11-14 16:44:19,413 - INFO - Processing document 4_2025-10-03
2025-11-14 16:44:19,446 - INFO - Finished converting document 4_2025-10-03 in 0.06 sec.
2025-11-14 16:44:19,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,496 - INFO - Going to convert document batch...
2025-11-14 16:44:19,497 - INFO - Processing document 4_2025-10-16
2025-11-14 16:44:19,517 - INFO - Finished converting document 4_2025-10-16 in 0.05 sec.
2025-11-14 16:44:19,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,562 - INFO - Going to convert document batch...
2025-11-14 16:44:19,563 - INFO - Processing document 4_2025-10-27
2025-11-14 16:44:19,589 - INFO - Finished converting document 4_2025-10-27 in 0.06 sec.
2025-11-14 16:44:19,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,636 - INFO - Going to convert document batch...
2025-11-14 16:44:19,637 - 

Converted 'data\edgar_documents\GILD\4_2025-10-03' --> 'data\processed_data\GILD\4_2025-10-03.md'
Converted 'data\edgar_documents\GILD\4_2025-10-16' --> 'data\processed_data\GILD\4_2025-10-16.md'
Converted 'data\edgar_documents\GILD\4_2025-10-27' --> 'data\processed_data\GILD\4_2025-10-27.md'


2025-11-14 16:44:19,661 - INFO - Finished converting document 4_2025-10-29 in 0.05 sec.
2025-11-14 16:44:19,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,733 - INFO - Going to convert document batch...
2025-11-14 16:44:19,734 - INFO - Processing document 8-K_2023-02-02
2025-11-14 16:44:19,760 - INFO - Finished converting document 8-K_2023-02-02 in 0.08 sec.
2025-11-14 16:44:19,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,798 - INFO - Going to convert document batch...
2025-11-14 16:44:19,799 - INFO - Processing document 8-K_2023-02-06
2025-11-14 16:44:19,817 - INFO - Finished converting document 8-K_2023-02-06 in 0.05 sec.
2025-11-14 16:44:19,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,862 - INFO - Going to convert document batch...
2025-11-14 16:44:19,863 - INFO - Processing document 8-K_2023-04-27


Converted 'data\edgar_documents\GILD\4_2025-10-29' --> 'data\processed_data\GILD\4_2025-10-29.md'
Converted 'data\edgar_documents\GILD\8-K_2023-02-02' --> 'data\processed_data\GILD\8-K_2023-02-02.md'
Converted 'data\edgar_documents\GILD\8-K_2023-02-06' --> 'data\processed_data\GILD\8-K_2023-02-06.md'


2025-11-14 16:44:19,884 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 16:44:19,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:19,943 - INFO - Going to convert document batch...
2025-11-14 16:44:19,944 - INFO - Processing document 8-K_2023-05-05
2025-11-14 16:44:19,983 - INFO - Finished converting document 8-K_2023-05-05 in 0.09 sec.
2025-11-14 16:44:20,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,085 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\8-K_2023-04-27' --> 'data\processed_data\GILD\8-K_2023-04-27.md'
Converted 'data\edgar_documents\GILD\8-K_2023-05-05' --> 'data\processed_data\GILD\8-K_2023-05-05.md'


2025-11-14 16:44:20,088 - INFO - Processing document 8-K_2023-08-03
2025-11-14 16:44:20,110 - INFO - Finished converting document 8-K_2023-08-03 in 0.11 sec.
2025-11-14 16:44:20,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,150 - INFO - Going to convert document batch...
2025-11-14 16:44:20,151 - INFO - Processing document 8-K_2023-08-16
2025-11-14 16:44:20,170 - INFO - Finished converting document 8-K_2023-08-16 in 0.05 sec.
2025-11-14 16:44:20,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,229 - INFO - Going to convert document batch...
2025-11-14 16:44:20,229 - INFO - Processing document 8-K_2023-09-14
2025-11-14 16:44:20,266 - INFO - Finished converting document 8-K_2023-09-14 in 0.08 sec.


Converted 'data\edgar_documents\GILD\8-K_2023-08-03' --> 'data\processed_data\GILD\8-K_2023-08-03.md'
Converted 'data\edgar_documents\GILD\8-K_2023-08-16' --> 'data\processed_data\GILD\8-K_2023-08-16.md'
Converted 'data\edgar_documents\GILD\8-K_2023-09-14' --> 'data\processed_data\GILD\8-K_2023-09-14.md'


2025-11-14 16:44:20,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,377 - INFO - Going to convert document batch...
2025-11-14 16:44:20,378 - INFO - Processing document 8-K_2023-11-07
2025-11-14 16:44:20,417 - INFO - Finished converting document 8-K_2023-11-07 in 0.09 sec.
2025-11-14 16:44:20,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,496 - INFO - Going to convert document batch...
2025-11-14 16:44:20,498 - INFO - Processing document 8-K_2024-02-02
2025-11-14 16:44:20,523 - INFO - Finished converting document 8-K_2024-02-02 in 0.08 sec.
2025-11-14 16:44:20,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,563 - INFO - Going to convert document batch...
2025-11-14 16:44:20,564 - INFO - Processing document 8-K_2024-02-06
2025-11-14 16:44:20,588 - INFO - Finished converting document 8-K_2024-02-06 in 0.06 sec.
2025-11-14 16:44:20,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\GILD\8-K_2023-11-07' --> 'data\processed_data\GILD\8-K_2023-11-07.md'
Converted 'data\edgar_documents\GILD\8-K_2024-02-02' --> 'data\processed_data\GILD\8-K_2024-02-02.md'
Converted 'data\edgar_documents\GILD\8-K_2024-02-06' --> 'data\processed_data\GILD\8-K_2024-02-06.md'


2025-11-14 16:44:20,632 - INFO - Processing document 8-K_2024-02-12
2025-11-14 16:44:20,669 - INFO - Finished converting document 8-K_2024-02-12 in 0.08 sec.
2025-11-14 16:44:20,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,725 - INFO - Going to convert document batch...
2025-11-14 16:44:20,726 - INFO - Processing document 8-K_2024-03-14
2025-11-14 16:44:20,742 - INFO - Finished converting document 8-K_2024-03-14 in 0.03 sec.
2025-11-14 16:44:20,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,778 - INFO - Going to convert document batch...
2025-11-14 16:44:20,779 - INFO - Processing document 8-K_2024-03-22
2025-11-14 16:44:20,804 - INFO - Finished converting document 8-K_2024-03-22 in 0.05 sec.
2025-11-14 16:44:20,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,855 - INFO - Going to convert document batch...
2025-11-14 16:44:20,856 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:

Converted 'data\edgar_documents\GILD\8-K_2024-02-12' --> 'data\processed_data\GILD\8-K_2024-02-12.md'
Converted 'data\edgar_documents\GILD\8-K_2024-03-14' --> 'data\processed_data\GILD\8-K_2024-03-14.md'
Converted 'data\edgar_documents\GILD\8-K_2024-03-22' --> 'data\processed_data\GILD\8-K_2024-03-22.md'


2025-11-14 16:44:20,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:20,937 - INFO - Going to convert document batch...
2025-11-14 16:44:20,939 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:44:20,982 - INFO - Finished converting document 8-K_2024-05-09 in 0.09 sec.
2025-11-14 16:44:21,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,072 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\8-K_2024-04-25' --> 'data\processed_data\GILD\8-K_2024-04-25.md'
Converted 'data\edgar_documents\GILD\8-K_2024-05-09' --> 'data\processed_data\GILD\8-K_2024-05-09.md'


2025-11-14 16:44:21,072 - INFO - Processing document 8-K_2024-07-17
2025-11-14 16:44:21,100 - INFO - Finished converting document 8-K_2024-07-17 in 0.09 sec.
2025-11-14 16:44:21,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,147 - INFO - Going to convert document batch...
2025-11-14 16:44:21,148 - INFO - Processing document 8-K_2024-08-08
2025-11-14 16:44:21,176 - INFO - Finished converting document 8-K_2024-08-08 in 0.06 sec.
2025-11-14 16:44:21,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,230 - INFO - Going to convert document batch...
2025-11-14 16:44:21,230 - INFO - Processing document 8-K_2024-11-06
2025-11-14 16:44:21,257 - INFO - Finished converting document 8-K_2024-11-06 in 0.06 sec.
2025-11-14 16:44:21,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,296 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GILD\8-K_2024-07-17' --> 'data\processed_data\GILD\8-K_2024-07-17.md'
Converted 'data\edgar_documents\GILD\8-K_2024-08-08' --> 'data\processed_data\GILD\8-K_2024-08-08.md'
Converted 'data\edgar_documents\GILD\8-K_2024-11-06' --> 'data\processed_data\GILD\8-K_2024-11-06.md'


2025-11-14 16:44:21,297 - INFO - Processing document 8-K_2024-11-20
2025-11-14 16:44:21,329 - INFO - Finished converting document 8-K_2024-11-20 in 0.06 sec.
2025-11-14 16:44:21,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,378 - INFO - Going to convert document batch...
2025-11-14 16:44:21,379 - INFO - Processing document 8-K_2024-12-13
2025-11-14 16:44:21,405 - INFO - Finished converting document 8-K_2024-12-13 in 0.05 sec.
2025-11-14 16:44:21,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,469 - INFO - Going to convert document batch...
2025-11-14 16:44:21,470 - INFO - Processing document 8-K_2025-02-11
2025-11-14 16:44:21,493 - INFO - Finished converting document 8-K_2025-02-11 in 0.06 sec.
2025-11-14 16:44:21,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:21,527 - INFO - Going to convert document batch...
2025-11-14 16:44:21,528 - INFO - Processing document 8-K_2025-03-12
2025-11-14 16:

Converted 'data\edgar_documents\GILD\8-K_2024-11-20' --> 'data\processed_data\GILD\8-K_2024-11-20.md'
Converted 'data\edgar_documents\GILD\8-K_2024-12-13' --> 'data\processed_data\GILD\8-K_2024-12-13.md'
Converted 'data\edgar_documents\GILD\8-K_2025-02-11' --> 'data\processed_data\GILD\8-K_2025-02-11.md'


2025-11-14 16:44:21,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\8-K_2025-03-12' --> 'data\processed_data\GILD\8-K_2025-03-12.md'


2025-11-14 16:44:21,931 - INFO - Going to convert document batch...
2025-11-14 16:44:21,932 - INFO - Processing document 8-K_2025-04-24
2025-11-14 16:44:21,957 - INFO - Finished converting document 8-K_2025-04-24 in 0.39 sec.
2025-11-14 16:44:21,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:22,010 - INFO - Going to convert document batch...
2025-11-14 16:44:22,011 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:44:22,062 - INFO - Finished converting document 8-K_2025-05-08 in 0.09 sec.
2025-11-14 16:44:22,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:22,140 - INFO - Going to convert document batch...
2025-11-14 16:44:22,141 - INFO - Processing document 8-K_2025-08-04


Converted 'data\edgar_documents\GILD\8-K_2025-04-24' --> 'data\processed_data\GILD\8-K_2025-04-24.md'
Converted 'data\edgar_documents\GILD\8-K_2025-05-08' --> 'data\processed_data\GILD\8-K_2025-05-08.md'


2025-11-14 16:44:22,159 - INFO - Finished converting document 8-K_2025-08-04 in 0.08 sec.
2025-11-14 16:44:22,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:22,197 - INFO - Going to convert document batch...
2025-11-14 16:44:22,198 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:44:22,229 - INFO - Finished converting document 8-K_2025-08-07 in 0.06 sec.
2025-11-14 16:44:22,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:22,267 - INFO - Going to convert document batch...
2025-11-14 16:44:22,267 - INFO - Processing document 8-K_2025-08-14
2025-11-14 16:44:22,282 - INFO - Finished converting document 8-K_2025-08-14 in 0.05 sec.
2025-11-14 16:44:22,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:44:22,314 - INFO - Going to convert document batch...
2025-11-14 16:44:22,315 - INFO - Processing document 8-K_2025-10-06
2025-11-14 16:44:22,332 - INFO - Finished converting document 8-K_2025-10-06 in 0.

Converted 'data\edgar_documents\GILD\8-K_2025-08-04' --> 'data\processed_data\GILD\8-K_2025-08-04.md'
Converted 'data\edgar_documents\GILD\8-K_2025-08-07' --> 'data\processed_data\GILD\8-K_2025-08-07.md'
Converted 'data\edgar_documents\GILD\8-K_2025-08-14' --> 'data\processed_data\GILD\8-K_2025-08-14.md'
Converted 'data\edgar_documents\GILD\8-K_2025-10-06' --> 'data\processed_data\GILD\8-K_2025-10-06.md'


2025-11-14 16:44:22,365 - INFO - Processing document 8-K_2025-10-30
2025-11-14 16:44:22,389 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 16:44:22,508 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:44:22,509 - ERROR - Input document DEF-14A_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:44:22,512 - INFO - Going to convert document batch...
2025-11-14 16:44:22,565 - INFO - detected formats:

Converted 'data\edgar_documents\GILD\8-K_2025-10-30' --> 'data\processed_data\GILD\8-K_2025-10-30.md'
Error processing data\edgar_documents\GILD\DEF-14A_2023-03-23: File format not allowed: data\edgar_documents\GILD\DEF-14A_2023-03-23


2025-11-14 16:44:23,139 - INFO - Going to convert document batch...
2025-11-14 16:44:23,140 - INFO - Processing document DEF-14A_2024-03-28
2025-11-14 16:44:25,287 - INFO - Finished converting document DEF-14A_2024-03-28 in 2.77 sec.
2025-11-14 16:44:26,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\DEF-14A_2024-03-28' --> 'data\processed_data\GILD\DEF-14A_2024-03-28.md'


2025-11-14 16:44:27,801 - INFO - Going to convert document batch...
2025-11-14 16:44:27,802 - INFO - Processing document DEF-14A_2025-03-27
2025-11-14 16:44:29,674 - INFO - Finished converting document DEF-14A_2025-03-27 in 2.95 sec.
2025-11-14 16:44:31,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GILD\DEF-14A_2025-03-27' --> 'data\processed_data\GILD\DEF-14A_2025-03-27.md'
Processed 139 new files. Errors: 4
Found 96 files to process in data\edgar_documents\GM


2025-11-14 16:44:33,199 - INFO - Going to convert document batch...
2025-11-14 16:44:33,200 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:44:33,201 - INFO - Processing document 10-K_2023-01-31
2025-11-14 16:44:35,935 - INFO - Finished converting document 10-K_2023-01-31 in 4.80 sec.
2025-11-14 16:44:37,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-K_2023-01-31' --> 'data\processed_data\GM\10-K_2023-01-31.md'


2025-11-14 16:44:38,838 - INFO - Going to convert document batch...
2025-11-14 16:44:38,840 - INFO - Processing document 10-K_2024-01-30
2025-11-14 16:44:41,791 - INFO - Finished converting document 10-K_2024-01-30 in 4.88 sec.
2025-11-14 16:44:42,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-K_2024-01-30' --> 'data\processed_data\GM\10-K_2024-01-30.md'


2025-11-14 16:44:44,916 - INFO - Going to convert document batch...
2025-11-14 16:44:44,917 - INFO - Processing document 10-K_2025-01-28
2025-11-14 16:44:48,172 - INFO - Finished converting document 10-K_2025-01-28 in 5.42 sec.
2025-11-14 16:44:49,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-K_2025-01-28' --> 'data\processed_data\GM\10-K_2025-01-28.md'


2025-11-14 16:44:50,667 - INFO - Going to convert document batch...
2025-11-14 16:44:50,668 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 16:44:52,032 - INFO - Finished converting document 10-Q_2023-04-25 in 2.19 sec.
2025-11-14 16:44:52,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2023-04-25' --> 'data\processed_data\GM\10-Q_2023-04-25.md'


2025-11-14 16:44:54,154 - INFO - Going to convert document batch...
2025-11-14 16:44:54,155 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 16:44:55,886 - INFO - Finished converting document 10-Q_2023-07-25 in 3.20 sec.
2025-11-14 16:44:56,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2023-07-25' --> 'data\processed_data\GM\10-Q_2023-07-25.md'


2025-11-14 16:44:57,970 - INFO - Going to convert document batch...
2025-11-14 16:44:57,971 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 16:44:59,637 - INFO - Finished converting document 10-Q_2023-10-24 in 3.02 sec.
2025-11-14 16:45:01,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2023-10-24' --> 'data\processed_data\GM\10-Q_2023-10-24.md'


2025-11-14 16:45:01,874 - INFO - Going to convert document batch...
2025-11-14 16:45:01,875 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 16:45:03,353 - INFO - Finished converting document 10-Q_2024-04-23 in 2.24 sec.
2025-11-14 16:45:04,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2024-04-23' --> 'data\processed_data\GM\10-Q_2024-04-23.md'


2025-11-14 16:45:05,250 - INFO - Going to convert document batch...
2025-11-14 16:45:05,250 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 16:45:06,874 - INFO - Finished converting document 10-Q_2024-07-23 in 2.86 sec.
2025-11-14 16:45:08,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2024-07-23' --> 'data\processed_data\GM\10-Q_2024-07-23.md'


2025-11-14 16:45:09,208 - INFO - Going to convert document batch...
2025-11-14 16:45:09,209 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 16:45:11,259 - INFO - Finished converting document 10-Q_2024-10-22 in 2.98 sec.
2025-11-14 16:45:12,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2024-10-22' --> 'data\processed_data\GM\10-Q_2024-10-22.md'


2025-11-14 16:45:12,837 - INFO - Going to convert document batch...
2025-11-14 16:45:12,838 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:45:14,287 - INFO - Finished converting document 10-Q_2025-05-01 in 2.22 sec.
2025-11-14 16:45:15,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2025-05-01' --> 'data\processed_data\GM\10-Q_2025-05-01.md'


2025-11-14 16:45:16,507 - INFO - Going to convert document batch...
2025-11-14 16:45:16,509 - INFO - Processing document 10-Q_2025-07-22
2025-11-14 16:45:18,355 - INFO - Finished converting document 10-Q_2025-07-22 in 3.39 sec.
2025-11-14 16:45:19,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\10-Q_2025-07-22' --> 'data\processed_data\GM\10-Q_2025-07-22.md'


2025-11-14 16:45:20,350 - INFO - Going to convert document batch...
2025-11-14 16:45:20,351 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 16:45:22,062 - INFO - Finished converting document 10-Q_2025-10-21 in 2.92 sec.
2025-11-14 16:45:22,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:22,924 - INFO - Going to convert document batch...
2025-11-14 16:45:22,925 - INFO - Processing document 4_2023-01-04
2025-11-14 16:45:22,955 - INFO - Finished converting document 4_2023-01-04 in 0.08 sec.
2025-11-14 16:45:23,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:23,035 - INFO - Going to convert document batch...
2025-11-14 16:45:23,036 - INFO - Processing document 4_2023-02-06


Converted 'data\edgar_documents\GM\10-Q_2025-10-21' --> 'data\processed_data\GM\10-Q_2025-10-21.md'
Converted 'data\edgar_documents\GM\4_2023-01-04' --> 'data\processed_data\GM\4_2023-01-04.md'


2025-11-14 16:45:23,596 - INFO - Finished converting document 4_2023-02-06 in 0.61 sec.
2025-11-14 16:45:23,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:23,677 - INFO - Going to convert document batch...
2025-11-14 16:45:23,679 - INFO - Processing document 4_2023-02-09
2025-11-14 16:45:23,702 - INFO - Finished converting document 4_2023-02-09 in 0.08 sec.
2025-11-14 16:45:23,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:23,749 - INFO - Going to convert document batch...
2025-11-14 16:45:23,749 - INFO - Processing document 4_2023-02-13
2025-11-14 16:45:23,777 - INFO - Finished converting document 4_2023-02-13 in 0.06 sec.
2025-11-14 16:45:23,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\4_2023-02-06' --> 'data\processed_data\GM\4_2023-02-06.md'
Converted 'data\edgar_documents\GM\4_2023-02-09' --> 'data\processed_data\GM\4_2023-02-09.md'
Converted 'data\edgar_documents\GM\4_2023-02-13' --> 'data\processed_data\GM\4_2023-02-13.md'


2025-11-14 16:45:23,837 - INFO - Going to convert document batch...
2025-11-14 16:45:23,838 - INFO - Processing document 4_2023-02-14
2025-11-14 16:45:23,866 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.
2025-11-14 16:45:23,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:23,916 - INFO - Going to convert document batch...
2025-11-14 16:45:23,917 - INFO - Processing document 4_2023-05-22
2025-11-14 16:45:23,937 - INFO - Finished converting document 4_2023-05-22 in 0.05 sec.
2025-11-14 16:45:23,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:23,987 - INFO - Going to convert document batch...
2025-11-14 16:45:23,988 - INFO - Processing document 4_2023-07-05
2025-11-14 16:45:24,013 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 16:45:24,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,075 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2023-02-14' --> 'data\processed_data\GM\4_2023-02-14.md'
Converted 'data\edgar_documents\GM\4_2023-05-22' --> 'data\processed_data\GM\4_2023-05-22.md'
Converted 'data\edgar_documents\GM\4_2023-07-05' --> 'data\processed_data\GM\4_2023-07-05.md'


2025-11-14 16:45:24,075 - INFO - Processing document 4_2023-07-14
2025-11-14 16:45:24,184 - INFO - Finished converting document 4_2023-07-14 in 0.14 sec.
2025-11-14 16:45:24,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,273 - INFO - Going to convert document batch...
2025-11-14 16:45:24,273 - INFO - Processing document 4_2023-08-11
2025-11-14 16:45:24,297 - INFO - Finished converting document 4_2023-08-11 in 0.06 sec.
2025-11-14 16:45:24,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,353 - INFO - Going to convert document batch...
2025-11-14 16:45:24,354 - INFO - Processing document 4_2023-12-05
2025-11-14 16:45:24,376 - INFO - Finished converting document 4_2023-12-05 in 0.06 sec.
2025-11-14 16:45:24,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,419 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2023-07-14' --> 'data\processed_data\GM\4_2023-07-14.md'
Converted 'data\edgar_documents\GM\4_2023-08-11' --> 'data\processed_data\GM\4_2023-08-11.md'
Converted 'data\edgar_documents\GM\4_2023-12-05' --> 'data\processed_data\GM\4_2023-12-05.md'


2025-11-14 16:45:24,420 - INFO - Processing document 4_2023-12-15
2025-11-14 16:45:24,440 - INFO - Finished converting document 4_2023-12-15 in 0.05 sec.
2025-11-14 16:45:24,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,493 - INFO - Going to convert document batch...
2025-11-14 16:45:24,493 - INFO - Processing document 4_2024-01-03
2025-11-14 16:45:24,520 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 16:45:24,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,579 - INFO - Going to convert document batch...
2025-11-14 16:45:24,580 - INFO - Processing document 4_2024-02-08
2025-11-14 16:45:24,607 - INFO - Finished converting document 4_2024-02-08 in 0.06 sec.
2025-11-14 16:45:24,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,652 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2023-12-15' --> 'data\processed_data\GM\4_2023-12-15.md'
Converted 'data\edgar_documents\GM\4_2024-01-03' --> 'data\processed_data\GM\4_2024-01-03.md'
Converted 'data\edgar_documents\GM\4_2024-02-08' --> 'data\processed_data\GM\4_2024-02-08.md'


2025-11-14 16:45:24,653 - INFO - Processing document 4_2024-02-21
2025-11-14 16:45:24,683 - INFO - Finished converting document 4_2024-02-21 in 0.06 sec.
2025-11-14 16:45:24,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,746 - INFO - Going to convert document batch...
2025-11-14 16:45:24,748 - INFO - Processing document 4_2024-02-28
2025-11-14 16:45:24,769 - INFO - Finished converting document 4_2024-02-28 in 0.05 sec.
2025-11-14 16:45:24,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,811 - INFO - Going to convert document batch...
2025-11-14 16:45:24,811 - INFO - Processing document 4_2024-03-22
2025-11-14 16:45:24,830 - INFO - Finished converting document 4_2024-03-22 in 0.05 sec.
2025-11-14 16:45:24,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,884 - INFO - Going to convert document batch...
2025-11-14 16:45:24,885 - INFO - Processing document 4_2024-04-01
2025-11-14 16:45:24,905 - IN

Converted 'data\edgar_documents\GM\4_2024-02-21' --> 'data\processed_data\GM\4_2024-02-21.md'
Converted 'data\edgar_documents\GM\4_2024-02-28' --> 'data\processed_data\GM\4_2024-02-28.md'
Converted 'data\edgar_documents\GM\4_2024-03-22' --> 'data\processed_data\GM\4_2024-03-22.md'


2025-11-14 16:45:24,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:24,953 - INFO - Going to convert document batch...
2025-11-14 16:45:24,954 - INFO - Processing document 4_2024-05-30
2025-11-14 16:45:24,976 - INFO - Finished converting document 4_2024-05-30 in 0.05 sec.
2025-11-14 16:45:25,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,037 - INFO - Going to convert document batch...
2025-11-14 16:45:25,038 - INFO - Processing document 4_2024-06-04
2025-11-14 16:45:25,059 - INFO - Finished converting document 4_2024-06-04 in 0.06 sec.
2025-11-14 16:45:25,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,110 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2024-04-01' --> 'data\processed_data\GM\4_2024-04-01.md'
Converted 'data\edgar_documents\GM\4_2024-05-30' --> 'data\processed_data\GM\4_2024-05-30.md'
Converted 'data\edgar_documents\GM\4_2024-06-04' --> 'data\processed_data\GM\4_2024-06-04.md'


2025-11-14 16:45:25,110 - INFO - Processing document 4_2024-06-11
2025-11-14 16:45:25,130 - INFO - Finished converting document 4_2024-06-11 in 0.05 sec.
2025-11-14 16:45:25,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,284 - INFO - Going to convert document batch...
2025-11-14 16:45:25,286 - INFO - Processing document 4_2024-06-12
2025-11-14 16:45:25,309 - INFO - Finished converting document 4_2024-06-12 in 0.11 sec.
2025-11-14 16:45:25,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,357 - INFO - Going to convert document batch...
2025-11-14 16:45:25,358 - INFO - Processing document 4_2024-07-29
2025-11-14 16:45:25,378 - INFO - Finished converting document 4_2024-07-29 in 0.05 sec.


Converted 'data\edgar_documents\GM\4_2024-06-11' --> 'data\processed_data\GM\4_2024-06-11.md'
Converted 'data\edgar_documents\GM\4_2024-06-12' --> 'data\processed_data\GM\4_2024-06-12.md'


2025-11-14 16:45:25,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,428 - INFO - Going to convert document batch...
2025-11-14 16:45:25,429 - INFO - Processing document 4_2024-08-01
2025-11-14 16:45:25,469 - INFO - Finished converting document 4_2024-08-01 in 0.06 sec.
2025-11-14 16:45:25,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,518 - INFO - Going to convert document batch...
2025-11-14 16:45:25,519 - INFO - Processing document 4_2024-08-20
2025-11-14 16:45:25,541 - INFO - Finished converting document 4_2024-08-20 in 0.05 sec.
2025-11-14 16:45:25,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,587 - INFO - Going to convert document batch...
2025-11-14 16:45:25,588 - INFO - Processing document 4_2024-08-27


Converted 'data\edgar_documents\GM\4_2024-07-29' --> 'data\processed_data\GM\4_2024-07-29.md'
Converted 'data\edgar_documents\GM\4_2024-08-01' --> 'data\processed_data\GM\4_2024-08-01.md'
Converted 'data\edgar_documents\GM\4_2024-08-20' --> 'data\processed_data\GM\4_2024-08-20.md'


2025-11-14 16:45:25,613 - INFO - Finished converting document 4_2024-08-27 in 0.05 sec.
2025-11-14 16:45:25,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,676 - INFO - Going to convert document batch...
2025-11-14 16:45:25,677 - INFO - Processing document 4_2024-10-24
2025-11-14 16:45:25,714 - INFO - Finished converting document 4_2024-10-24 in 0.08 sec.
2025-11-14 16:45:25,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:25,766 - INFO - Going to convert document batch...
2025-11-14 16:45:25,767 - INFO - Processing document 4_2024-11-08
2025-11-14 16:45:25,792 - INFO - Finished converting document 4_2024-11-08 in 0.06 sec.
2025-11-14 16:45:25,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\4_2024-08-27' --> 'data\processed_data\GM\4_2024-08-27.md'
Converted 'data\edgar_documents\GM\4_2024-10-24' --> 'data\processed_data\GM\4_2024-10-24.md'
Converted 'data\edgar_documents\GM\4_2024-11-08' --> 'data\processed_data\GM\4_2024-11-08.md'


2025-11-14 16:45:25,846 - INFO - Going to convert document batch...
2025-11-14 16:45:25,847 - INFO - Processing document 4_2024-11-12
2025-11-14 16:45:25,949 - INFO - Finished converting document 4_2024-11-12 in 0.12 sec.
2025-11-14 16:45:26,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,061 - INFO - Going to convert document batch...
2025-11-14 16:45:26,062 - INFO - Processing document 4_2024-11-19
2025-11-14 16:45:26,103 - INFO - Finished converting document 4_2024-11-19 in 0.11 sec.
2025-11-14 16:45:26,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,166 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2024-11-12' --> 'data\processed_data\GM\4_2024-11-12.md'
Converted 'data\edgar_documents\GM\4_2024-11-19' --> 'data\processed_data\GM\4_2024-11-19.md'


2025-11-14 16:45:26,167 - INFO - Processing document 4_2024-11-20
2025-11-14 16:45:26,217 - INFO - Finished converting document 4_2024-11-20 in 0.08 sec.
2025-11-14 16:45:26,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,313 - INFO - Going to convert document batch...
2025-11-14 16:45:26,314 - INFO - Processing document 4_2024-11-27
2025-11-14 16:45:26,337 - INFO - Finished converting document 4_2024-11-27 in 0.08 sec.
2025-11-14 16:45:26,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,384 - INFO - Going to convert document batch...
2025-11-14 16:45:26,385 - INFO - Processing document 4_2025-01-03
2025-11-14 16:45:26,408 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.


Converted 'data\edgar_documents\GM\4_2024-11-20' --> 'data\processed_data\GM\4_2024-11-20.md'
Converted 'data\edgar_documents\GM\4_2024-11-27' --> 'data\processed_data\GM\4_2024-11-27.md'


2025-11-14 16:45:26,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,465 - INFO - Going to convert document batch...
2025-11-14 16:45:26,466 - INFO - Processing document 4_2025-01-30
2025-11-14 16:45:26,498 - INFO - Finished converting document 4_2025-01-30 in 0.06 sec.
2025-11-14 16:45:26,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,556 - INFO - Going to convert document batch...
2025-11-14 16:45:26,557 - INFO - Processing document 4_2025-02-06
2025-11-14 16:45:26,577 - INFO - Finished converting document 4_2025-02-06 in 0.05 sec.
2025-11-14 16:45:26,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\4_2025-01-03' --> 'data\processed_data\GM\4_2025-01-03.md'
Converted 'data\edgar_documents\GM\4_2025-01-30' --> 'data\processed_data\GM\4_2025-01-30.md'
Converted 'data\edgar_documents\GM\4_2025-02-06' --> 'data\processed_data\GM\4_2025-02-06.md'


2025-11-14 16:45:26,638 - INFO - Going to convert document batch...
2025-11-14 16:45:26,639 - INFO - Processing document 4_2025-02-10
2025-11-14 16:45:26,677 - INFO - Finished converting document 4_2025-02-10 in 0.08 sec.
2025-11-14 16:45:26,777 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:45:26,778 - ERROR - Input document 4_2025-05-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:45:26,780 - INFO - Going to convert document batch...
2025-11-14 16:45:26,802 - IN

Converted 'data\edgar_documents\GM\4_2025-02-10' --> 'data\processed_data\GM\4_2025-02-10.md'
Error processing data\edgar_documents\GM\4_2025-05-05: File format not allowed: data\edgar_documents\GM\4_2025-05-05
Error processing data\edgar_documents\GM\4_2025-05-06: File format not allowed: data\edgar_documents\GM\4_2025-05-06
Converted 'data\edgar_documents\GM\4_2025-07-31' --> 'data\processed_data\GM\4_2025-07-31.md'


2025-11-14 16:45:26,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:26,942 - INFO - Going to convert document batch...
2025-11-14 16:45:26,943 - INFO - Processing document 4_2025-08-07
2025-11-14 16:45:26,994 - INFO - Finished converting document 4_2025-08-07 in 0.09 sec.
2025-11-14 16:45:27,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,073 - INFO - Going to convert document batch...
2025-11-14 16:45:27,074 - INFO - Processing document 4_2025-08-15
2025-11-14 16:45:27,103 - INFO - Finished converting document 4_2025-08-15 in 0.06 sec.
2025-11-14 16:45:27,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,155 - INFO - Going to convert document batch...
2025-11-14 16:45:27,155 - INFO - Processing document 4_2025-08-29
2025-11-14 16:45:27,191 - INFO - Finished converting document 4_2025-08-29 in 0.06 sec.


Converted 'data\edgar_documents\GM\4_2025-08-07' --> 'data\processed_data\GM\4_2025-08-07.md'
Converted 'data\edgar_documents\GM\4_2025-08-15' --> 'data\processed_data\GM\4_2025-08-15.md'


2025-11-14 16:45:27,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,324 - INFO - Going to convert document batch...
2025-11-14 16:45:27,325 - INFO - Processing document 4_2025-09-16
2025-11-14 16:45:27,357 - INFO - Finished converting document 4_2025-09-16 in 0.14 sec.
2025-11-14 16:45:27,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\4_2025-08-29' --> 'data\processed_data\GM\4_2025-08-29.md'
Converted 'data\edgar_documents\GM\4_2025-09-16' --> 'data\processed_data\GM\4_2025-09-16.md'


2025-11-14 16:45:27,423 - INFO - Going to convert document batch...
2025-11-14 16:45:27,424 - INFO - Processing document 4_2025-09-25
2025-11-14 16:45:27,466 - INFO - Finished converting document 4_2025-09-25 in 0.08 sec.
2025-11-14 16:45:27,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,528 - INFO - Going to convert document batch...
2025-11-14 16:45:27,529 - INFO - Processing document 4_2025-09-26
2025-11-14 16:45:27,568 - INFO - Finished converting document 4_2025-09-26 in 0.06 sec.
2025-11-14 16:45:27,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,627 - INFO - Going to convert document batch...
2025-11-14 16:45:27,627 - INFO - Processing document 4_2025-09-30
2025-11-14 16:45:27,655 - INFO - Finished converting document 4_2025-09-30 in 0.06 sec.
2025-11-14 16:45:27,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\4_2025-09-25' --> 'data\processed_data\GM\4_2025-09-25.md'
Converted 'data\edgar_documents\GM\4_2025-09-26' --> 'data\processed_data\GM\4_2025-09-26.md'
Converted 'data\edgar_documents\GM\4_2025-09-30' --> 'data\processed_data\GM\4_2025-09-30.md'


2025-11-14 16:45:27,709 - INFO - Going to convert document batch...
2025-11-14 16:45:27,710 - INFO - Processing document 4_2025-10-24
2025-11-14 16:45:27,820 - INFO - Finished converting document 4_2025-10-24 in 0.14 sec.
2025-11-14 16:45:27,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:27,922 - INFO - Going to convert document batch...
2025-11-14 16:45:27,923 - INFO - Processing document 4_2025-10-30
2025-11-14 16:45:27,957 - INFO - Finished converting document 4_2025-10-30 in 0.11 sec.
2025-11-14 16:45:27,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,035 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\4_2025-10-24' --> 'data\processed_data\GM\4_2025-10-24.md'
Converted 'data\edgar_documents\GM\4_2025-10-30' --> 'data\processed_data\GM\4_2025-10-30.md'


2025-11-14 16:45:28,037 - INFO - Processing document 8-K_2023-01-31
2025-11-14 16:45:28,071 - INFO - Finished converting document 8-K_2023-01-31 in 0.08 sec.
2025-11-14 16:45:28,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,110 - INFO - Going to convert document batch...
2025-11-14 16:45:28,110 - INFO - Processing document 8-K_2023-02-22
2025-11-14 16:45:28,126 - INFO - Finished converting document 8-K_2023-02-22 in 0.05 sec.
2025-11-14 16:45:28,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,160 - INFO - Going to convert document batch...
2025-11-14 16:45:28,161 - INFO - Processing document 8-K_2023-03-09
2025-11-14 16:45:28,180 - INFO - Finished converting document 8-K_2023-03-09 in 0.03 sec.
2025-11-14 16:45:28,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,217 - INFO - Going to convert document batch...
2025-11-14 16:45:28,218 - INFO - Processing document 8-K_2023-03-31
2025-11-14 16:

Converted 'data\edgar_documents\GM\8-K_2023-01-31' --> 'data\processed_data\GM\8-K_2023-01-31.md'
Converted 'data\edgar_documents\GM\8-K_2023-02-22' --> 'data\processed_data\GM\8-K_2023-02-22.md'
Converted 'data\edgar_documents\GM\8-K_2023-03-09' --> 'data\processed_data\GM\8-K_2023-03-09.md'
Converted 'data\edgar_documents\GM\8-K_2023-03-31' --> 'data\processed_data\GM\8-K_2023-03-31.md'


2025-11-14 16:45:28,283 - INFO - Going to convert document batch...
2025-11-14 16:45:28,285 - INFO - Processing document 8-K_2023-04-21
2025-11-14 16:45:28,312 - INFO - Finished converting document 8-K_2023-04-21 in 0.06 sec.
2025-11-14 16:45:28,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,375 - INFO - Going to convert document batch...
2025-11-14 16:45:28,376 - INFO - Processing document 8-K_2023-04-25
2025-11-14 16:45:28,402 - INFO - Finished converting document 8-K_2023-04-25 in 0.08 sec.
2025-11-14 16:45:28,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,436 - INFO - Going to convert document batch...
2025-11-14 16:45:28,437 - INFO - Processing document 8-K_2023-05-03
2025-11-14 16:45:28,454 - INFO - Finished converting document 8-K_2023-05-03 in 0.05 sec.
2025-11-14 16:45:28,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,492 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GM\8-K_2023-04-21' --> 'data\processed_data\GM\8-K_2023-04-21.md'
Converted 'data\edgar_documents\GM\8-K_2023-04-25' --> 'data\processed_data\GM\8-K_2023-04-25.md'
Converted 'data\edgar_documents\GM\8-K_2023-05-03' --> 'data\processed_data\GM\8-K_2023-05-03.md'


2025-11-14 16:45:28,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,554 - INFO - Going to convert document batch...
2025-11-14 16:45:28,555 - INFO - Processing document 8-K_2023-07-25
2025-11-14 16:45:28,575 - INFO - Finished converting document 8-K_2023-07-25 in 0.06 sec.
2025-11-14 16:45:28,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,621 - INFO - Going to convert document batch...
2025-11-14 16:45:28,622 - INFO - Processing document 8-K_2023-10-04
2025-11-14 16:45:28,653 - INFO - Finished converting document 8-K_2023-10-04 in 0.06 sec.


Converted 'data\edgar_documents\GM\8-K_2023-06-22' --> 'data\processed_data\GM\8-K_2023-06-22.md'
Converted 'data\edgar_documents\GM\8-K_2023-07-25' --> 'data\processed_data\GM\8-K_2023-07-25.md'


2025-11-14 16:45:28,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,803 - INFO - Going to convert document batch...
2025-11-14 16:45:28,804 - INFO - Processing document 8-K_2023-10-24
2025-11-14 16:45:28,825 - INFO - Finished converting document 8-K_2023-10-24 in 0.09 sec.
2025-11-14 16:45:28,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:28,886 - INFO - Going to convert document batch...
2025-11-14 16:45:28,887 - INFO - Processing document 8-K_2023-11-29


Converted 'data\edgar_documents\GM\8-K_2023-10-04' --> 'data\processed_data\GM\8-K_2023-10-04.md'
Converted 'data\edgar_documents\GM\8-K_2023-10-24' --> 'data\processed_data\GM\8-K_2023-10-24.md'


2025-11-14 16:45:29,210 - INFO - Finished converting document 8-K_2023-11-29 in 0.36 sec.
2025-11-14 16:45:29,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,363 - INFO - Going to convert document batch...
2025-11-14 16:45:29,365 - INFO - Processing document 8-K_2023-12-13
2025-11-14 16:45:29,384 - INFO - Finished converting document 8-K_2023-12-13 in 0.14 sec.


Converted 'data\edgar_documents\GM\8-K_2023-11-29' --> 'data\processed_data\GM\8-K_2023-11-29.md'
Converted 'data\edgar_documents\GM\8-K_2023-12-13' --> 'data\processed_data\GM\8-K_2023-12-13.md'


2025-11-14 16:45:29,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,469 - INFO - Going to convert document batch...
2025-11-14 16:45:29,470 - INFO - Processing document 8-K_2024-01-30
2025-11-14 16:45:29,500 - INFO - Finished converting document 8-K_2024-01-30 in 0.08 sec.
2025-11-14 16:45:29,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,541 - INFO - Going to convert document batch...
2025-11-14 16:45:29,541 - INFO - Processing document 8-K_2024-03-28
2025-11-14 16:45:29,562 - INFO - Finished converting document 8-K_2024-03-28 in 0.05 sec.
2025-11-14 16:45:29,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,604 - INFO - Going to convert document batch...
2025-11-14 16:45:29,605 - INFO - Processing document 8-K_2024-04-23
2025-11-14 16:45:29,624 - INFO - Finished converting document 8-K_2024-04-23 in 0.05 sec.
2025-11-14 16:45:29,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\GM\8-K_2024-01-30' --> 'data\processed_data\GM\8-K_2024-01-30.md'
Converted 'data\edgar_documents\GM\8-K_2024-03-28' --> 'data\processed_data\GM\8-K_2024-03-28.md'
Converted 'data\edgar_documents\GM\8-K_2024-04-23' --> 'data\processed_data\GM\8-K_2024-04-23.md'


2025-11-14 16:45:29,709 - INFO - Finished converting document 8-K_2024-06-06 in 0.06 sec.
2025-11-14 16:45:29,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,757 - INFO - Going to convert document batch...
2025-11-14 16:45:29,758 - INFO - Processing document 8-K_2024-06-25
2025-11-14 16:45:29,777 - INFO - Finished converting document 8-K_2024-06-25 in 0.06 sec.
2025-11-14 16:45:29,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,811 - INFO - Going to convert document batch...
2025-11-14 16:45:29,813 - INFO - Processing document 8-K_2024-07-23
2025-11-14 16:45:29,834 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 16:45:29,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,873 - INFO - Going to convert document batch...
2025-11-14 16:45:29,874 - INFO - Processing document 8-K_2024-09-05
2025-11-14 16:45:29,891 - INFO - Finished converting document 8-K_2024-09-05 in 0.

Converted 'data\edgar_documents\GM\8-K_2024-06-06' --> 'data\processed_data\GM\8-K_2024-06-06.md'
Converted 'data\edgar_documents\GM\8-K_2024-06-25' --> 'data\processed_data\GM\8-K_2024-06-25.md'
Converted 'data\edgar_documents\GM\8-K_2024-07-23' --> 'data\processed_data\GM\8-K_2024-07-23.md'


2025-11-14 16:45:29,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,931 - INFO - Going to convert document batch...
2025-11-14 16:45:29,931 - INFO - Processing document 8-K_2024-10-09
2025-11-14 16:45:29,950 - INFO - Finished converting document 8-K_2024-10-09 in 0.05 sec.
2025-11-14 16:45:29,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:29,984 - INFO - Going to convert document batch...
2025-11-14 16:45:29,985 - INFO - Processing document 8-K_2024-10-22
2025-11-14 16:45:30,015 - INFO - Finished converting document 8-K_2024-10-22 in 0.06 sec.
2025-11-14 16:45:30,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,055 - INFO - Going to convert document batch...
2025-11-14 16:45:30,055 - INFO - Processing document 8-K_2024-12-04
2025-11-14 16:45:30,073 - INFO - Finished converting document 8-K_2024-12-04 in 0.05 sec.


Converted 'data\edgar_documents\GM\8-K_2024-09-05' --> 'data\processed_data\GM\8-K_2024-09-05.md'
Converted 'data\edgar_documents\GM\8-K_2024-10-09' --> 'data\processed_data\GM\8-K_2024-10-09.md'
Converted 'data\edgar_documents\GM\8-K_2024-10-22' --> 'data\processed_data\GM\8-K_2024-10-22.md'
Converted 'data\edgar_documents\GM\8-K_2024-12-04' --> 'data\processed_data\GM\8-K_2024-12-04.md'


2025-11-14 16:45:30,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,180 - INFO - Going to convert document batch...
2025-11-14 16:45:30,181 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:45:30,214 - INFO - Finished converting document 8-K_2024-12-10 in 0.14 sec.
2025-11-14 16:45:30,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,300 - INFO - Going to convert document batch...
2025-11-14 16:45:30,301 - INFO - Processing document 8-K_2025-01-28
2025-11-14 16:45:30,340 - INFO - Finished converting document 8-K_2025-01-28 in 0.12 sec.
2025-11-14 16:45:30,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,401 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\8-K_2024-12-10' --> 'data\processed_data\GM\8-K_2024-12-10.md'
Converted 'data\edgar_documents\GM\8-K_2025-01-28' --> 'data\processed_data\GM\8-K_2025-01-28.md'


2025-11-14 16:45:30,403 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:45:30,432 - INFO - Finished converting document 8-K_2025-02-26 in 0.06 sec.
2025-11-14 16:45:30,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,479 - INFO - Going to convert document batch...
2025-11-14 16:45:30,480 - INFO - Processing document 8-K_2025-03-26
2025-11-14 16:45:30,509 - INFO - Finished converting document 8-K_2025-03-26 in 0.06 sec.
2025-11-14 16:45:30,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,551 - INFO - Going to convert document batch...
2025-11-14 16:45:30,552 - INFO - Processing document 8-K_2025-04-29
2025-11-14 16:45:30,573 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 16:45:30,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,620 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GM\8-K_2025-02-26' --> 'data\processed_data\GM\8-K_2025-02-26.md'
Converted 'data\edgar_documents\GM\8-K_2025-03-26' --> 'data\processed_data\GM\8-K_2025-03-26.md'
Converted 'data\edgar_documents\GM\8-K_2025-04-29' --> 'data\processed_data\GM\8-K_2025-04-29.md'


2025-11-14 16:45:30,620 - INFO - Processing document 8-K_2025-05-01
2025-11-14 16:45:30,659 - INFO - Finished converting document 8-K_2025-05-01 in 0.08 sec.
2025-11-14 16:45:30,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,783 - INFO - Going to convert document batch...
2025-11-14 16:45:30,785 - INFO - Processing document 8-K_2025-05-07
2025-11-14 16:45:30,825 - INFO - Finished converting document 8-K_2025-05-07 in 0.14 sec.


Converted 'data\edgar_documents\GM\8-K_2025-05-01' --> 'data\processed_data\GM\8-K_2025-05-01.md'
Converted 'data\edgar_documents\GM\8-K_2025-05-07' --> 'data\processed_data\GM\8-K_2025-05-07.md'


2025-11-14 16:45:30,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:30,954 - INFO - Going to convert document batch...
2025-11-14 16:45:30,955 - INFO - Processing document 8-K_2025-06-05
2025-11-14 16:45:31,003 - INFO - Finished converting document 8-K_2025-06-05 in 0.14 sec.
2025-11-14 16:45:31,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:31,095 - INFO - Going to convert document batch...
2025-11-14 16:45:31,097 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:45:31,116 - INFO - Finished converting document 8-K_2025-07-22 in 0.09 sec.
2025-11-14 16:45:31,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:31,160 - INFO - Going to convert document batch...
2025-11-14 16:45:31,161 - INFO - Processing document 8-K_2025-10-14
2025-11-14 16:45:31,191 - INFO - Finished converting document 8-K_2025-10-14 in 0.06 sec.


Converted 'data\edgar_documents\GM\8-K_2025-06-05' --> 'data\processed_data\GM\8-K_2025-06-05.md'
Converted 'data\edgar_documents\GM\8-K_2025-07-22' --> 'data\processed_data\GM\8-K_2025-07-22.md'
Converted 'data\edgar_documents\GM\8-K_2025-10-14' --> 'data\processed_data\GM\8-K_2025-10-14.md'


2025-11-14 16:45:31,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:31,238 - INFO - Going to convert document batch...
2025-11-14 16:45:31,239 - INFO - Processing document 8-K_2025-10-21
2025-11-14 16:45:31,266 - INFO - Finished converting document 8-K_2025-10-21 in 0.06 sec.
2025-11-14 16:45:31,330 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:45:31,330 - ERROR - Input document DEF-14A_2023-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\GM\8-K_2025-10-21' --> 'data\processed_data\GM\8-K_2025-10-21.md'
Error processing data\edgar_documents\GM\DEF-14A_2023-04-28: File format not allowed: data\edgar_documents\GM\DEF-14A_2023-04-28


2025-11-14 16:45:32,691 - INFO - Going to convert document batch...
2025-11-14 16:45:32,692 - INFO - Processing document DEF-14A_2024-04-24
2025-11-14 16:45:35,021 - INFO - Finished converting document DEF-14A_2024-04-24 in 3.69 sec.


Converted 'data\edgar_documents\GM\DEF-14A_2024-04-24' --> 'data\processed_data\GM\DEF-14A_2024-04-24.md'


2025-11-14 16:45:36,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:45:37,992 - INFO - Going to convert document batch...
2025-11-14 16:45:37,994 - INFO - Processing document DEF-14A_2025-04-22
2025-11-14 16:45:42,335 - INFO - Finished converting document DEF-14A_2025-04-22 in 6.30 sec.
2025-11-14 16:45:43,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GM\DEF-14A_2025-04-22' --> 'data\processed_data\GM\DEF-14A_2025-04-22.md'
Processed 93 new files. Errors: 3
Found 287 files to process in data\edgar_documents\GOOGL


2025-11-14 16:45:44,246 - INFO - Going to convert document batch...
2025-11-14 16:45:44,247 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:45:44,248 - INFO - Processing document 10-K_2023-02-03
2025-11-14 16:45:45,955 - INFO - Finished converting document 10-K_2023-02-03 in 2.59 sec.
2025-11-14 16:45:47,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-K_2023-02-03' --> 'data\processed_data\GOOGL\10-K_2023-02-03.md'


2025-11-14 16:45:48,002 - INFO - Going to convert document batch...
2025-11-14 16:45:48,003 - INFO - Processing document 10-K_2024-01-31
2025-11-14 16:45:49,861 - INFO - Finished converting document 10-K_2024-01-31 in 2.53 sec.
2025-11-14 16:45:50,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-K_2024-01-31' --> 'data\processed_data\GOOGL\10-K_2024-01-31.md'


2025-11-14 16:45:51,606 - INFO - Going to convert document batch...
2025-11-14 16:45:51,607 - INFO - Processing document 10-K_2025-02-05
2025-11-14 16:45:53,644 - INFO - Finished converting document 10-K_2025-02-05 in 3.16 sec.
2025-11-14 16:45:54,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-K_2025-02-05' --> 'data\processed_data\GOOGL\10-K_2025-02-05.md'


2025-11-14 16:45:54,903 - INFO - Going to convert document batch...
2025-11-14 16:45:54,905 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 16:45:56,416 - INFO - Finished converting document 10-Q_2023-04-26 in 2.08 sec.
2025-11-14 16:45:56,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2023-04-26' --> 'data\processed_data\GOOGL\10-Q_2023-04-26.md'


2025-11-14 16:45:57,510 - INFO - Going to convert document batch...
2025-11-14 16:45:57,511 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 16:45:58,651 - INFO - Finished converting document 10-Q_2023-07-26 in 1.78 sec.
2025-11-14 16:45:59,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2023-07-26' --> 'data\processed_data\GOOGL\10-Q_2023-07-26.md'


2025-11-14 16:46:00,532 - INFO - Going to convert document batch...
2025-11-14 16:46:00,533 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 16:46:01,696 - INFO - Finished converting document 10-Q_2023-10-25 in 2.28 sec.
2025-11-14 16:46:02,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2023-10-25' --> 'data\processed_data\GOOGL\10-Q_2023-10-25.md'


2025-11-14 16:46:02,779 - INFO - Going to convert document batch...
2025-11-14 16:46:02,780 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 16:46:03,993 - INFO - Finished converting document 10-Q_2024-04-26 in 1.62 sec.
2025-11-14 16:46:04,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2024-04-26' --> 'data\processed_data\GOOGL\10-Q_2024-04-26.md'


2025-11-14 16:46:05,173 - INFO - Going to convert document batch...
2025-11-14 16:46:05,173 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 16:46:06,214 - INFO - Finished converting document 10-Q_2024-07-24 in 1.61 sec.
2025-11-14 16:46:06,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2024-07-24' --> 'data\processed_data\GOOGL\10-Q_2024-07-24.md'


2025-11-14 16:46:07,959 - INFO - Going to convert document batch...
2025-11-14 16:46:07,959 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 16:46:09,002 - INFO - Finished converting document 10-Q_2024-10-30 in 2.11 sec.
2025-11-14 16:46:09,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2024-10-30' --> 'data\processed_data\GOOGL\10-Q_2024-10-30.md'


2025-11-14 16:46:10,241 - INFO - Going to convert document batch...
2025-11-14 16:46:10,242 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 16:46:11,079 - INFO - Finished converting document 10-Q_2025-04-25 in 1.27 sec.
2025-11-14 16:46:11,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2025-04-25' --> 'data\processed_data\GOOGL\10-Q_2025-04-25.md'


2025-11-14 16:46:12,661 - INFO - Going to convert document batch...
2025-11-14 16:46:12,662 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:46:14,165 - INFO - Finished converting document 10-Q_2025-07-24 in 2.69 sec.
2025-11-14 16:46:14,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\10-Q_2025-07-24' --> 'data\processed_data\GOOGL\10-Q_2025-07-24.md'


2025-11-14 16:46:15,826 - INFO - Going to convert document batch...
2025-11-14 16:46:15,827 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 16:46:17,204 - INFO - Finished converting document 10-Q_2025-10-30 in 2.53 sec.
2025-11-14 16:46:17,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:17,788 - INFO - Going to convert document batch...
2025-11-14 16:46:17,789 - INFO - Processing document 4_2023-01-03
2025-11-14 16:46:17,823 - INFO - Finished converting document 4_2023-01-03 in 0.12 sec.


Converted 'data\edgar_documents\GOOGL\10-Q_2025-10-30' --> 'data\processed_data\GOOGL\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\GOOGL\4_2023-01-03' --> 'data\processed_data\GOOGL\4_2023-01-03.md'


2025-11-14 16:46:18,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,110 - INFO - Going to convert document batch...
2025-11-14 16:46:18,112 - INFO - Processing document 4_2023-01-04
2025-11-14 16:46:18,147 - INFO - Finished converting document 4_2023-01-04 in 0.28 sec.
2025-11-14 16:46:18,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,206 - INFO - Going to convert document batch...
2025-11-14 16:46:18,206 - INFO - Processing document 4_2023-01-06
2025-11-14 16:46:18,229 - INFO - Finished converting document 4_2023-01-06 in 0.06 sec.
2025-11-14 16:46:18,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,275 - INFO - Going to convert document batch...
2025-11-14 16:46:18,276 - INFO - Processing document 4_2023-01-25
2025-11-14 16:46:18,299 - INFO - Finished converting document 4_2023-01-25 in 0.05 sec.
2025-11-14 16:46:18,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\4_2023-01-04' --> 'data\processed_data\GOOGL\4_2023-01-04.md'
Converted 'data\edgar_documents\GOOGL\4_2023-01-06' --> 'data\processed_data\GOOGL\4_2023-01-06.md'
Converted 'data\edgar_documents\GOOGL\4_2023-01-25' --> 'data\processed_data\GOOGL\4_2023-01-25.md'


2025-11-14 16:46:18,369 - INFO - Processing document 4_2023-01-26
2025-11-14 16:46:18,419 - INFO - Finished converting document 4_2023-01-26 in 0.11 sec.
2025-11-14 16:46:18,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,509 - INFO - Going to convert document batch...
2025-11-14 16:46:18,511 - INFO - Processing document 4_2023-01-27
2025-11-14 16:46:18,541 - INFO - Finished converting document 4_2023-01-27 in 0.08 sec.
2025-11-14 16:46:18,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,609 - INFO - Going to convert document batch...
2025-11-14 16:46:18,609 - INFO - Processing document 4_2023-02-01
2025-11-14 16:46:18,632 - INFO - Finished converting document 4_2023-02-01 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-01-26' --> 'data\processed_data\GOOGL\4_2023-01-26.md'
Converted 'data\edgar_documents\GOOGL\4_2023-01-27' --> 'data\processed_data\GOOGL\4_2023-01-27.md'


2025-11-14 16:46:18,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,687 - INFO - Going to convert document batch...
2025-11-14 16:46:18,688 - INFO - Processing document 4_2023-02-08
2025-11-14 16:46:18,715 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-02-01' --> 'data\processed_data\GOOGL\4_2023-02-01.md'
Converted 'data\edgar_documents\GOOGL\4_2023-02-08' --> 'data\processed_data\GOOGL\4_2023-02-08.md'


2025-11-14 16:46:18,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:18,900 - INFO - Going to convert document batch...
2025-11-14 16:46:18,901 - INFO - Processing document 4_2023-02-28
2025-11-14 16:46:18,933 - INFO - Finished converting document 4_2023-02-28 in 0.09 sec.
2025-11-14 16:46:18,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,003 - INFO - Going to convert document batch...
2025-11-14 16:46:19,004 - INFO - Processing document 4_2023-03-01
2025-11-14 16:46:19,037 - INFO - Finished converting document 4_2023-03-01 in 0.06 sec.
2025-11-14 16:46:19,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,088 - INFO - Going to convert document batch...
2025-11-14 16:46:19,089 - INFO - Processing document 4_2023-03-10
2025-11-14 16:46:19,119 - INFO - Finished converting document 4_2023-03-10 in 0.06 sec.
2025-11-14 16:46:19,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-02-28' --> 'data\processed_data\GOOGL\4_2023-02-28.md'
Converted 'data\edgar_documents\GOOGL\4_2023-03-01' --> 'data\processed_data\GOOGL\4_2023-03-01.md'
Converted 'data\edgar_documents\GOOGL\4_2023-03-10' --> 'data\processed_data\GOOGL\4_2023-03-10.md'


2025-11-14 16:46:19,182 - INFO - Going to convert document batch...
2025-11-14 16:46:19,183 - INFO - Processing document 4_2023-03-15
2025-11-14 16:46:19,259 - INFO - Finished converting document 4_2023-03-15 in 0.11 sec.
2025-11-14 16:46:19,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,387 - INFO - Going to convert document batch...
2025-11-14 16:46:19,388 - INFO - Processing document 4_2023-03-16
2025-11-14 16:46:19,427 - INFO - Finished converting document 4_2023-03-16 in 0.11 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-03-15' --> 'data\processed_data\GOOGL\4_2023-03-15.md'
Converted 'data\edgar_documents\GOOGL\4_2023-03-16' --> 'data\processed_data\GOOGL\4_2023-03-16.md'


2025-11-14 16:46:19,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,543 - INFO - Going to convert document batch...
2025-11-14 16:46:19,543 - INFO - Processing document 4_2023-03-28
2025-11-14 16:46:19,589 - INFO - Finished converting document 4_2023-03-28 in 0.14 sec.
2025-11-14 16:46:19,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,699 - INFO - Going to convert document batch...
2025-11-14 16:46:19,700 - INFO - Processing document 4_2023-03-31
2025-11-14 16:46:19,734 - INFO - Finished converting document 4_2023-03-31 in 0.11 sec.
2025-11-14 16:46:19,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,790 - INFO - Going to convert document batch...
2025-11-14 16:46:19,791 - INFO - Processing document 4_2023-04-04


Converted 'data\edgar_documents\GOOGL\4_2023-03-28' --> 'data\processed_data\GOOGL\4_2023-03-28.md'
Converted 'data\edgar_documents\GOOGL\4_2023-03-31' --> 'data\processed_data\GOOGL\4_2023-03-31.md'


2025-11-14 16:46:19,818 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 16:46:19,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:19,963 - INFO - Going to convert document batch...
2025-11-14 16:46:19,964 - INFO - Processing document 4_2023-04-13
2025-11-14 16:46:19,987 - INFO - Finished converting document 4_2023-04-13 in 0.12 sec.
2025-11-14 16:46:20,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,048 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2023-04-04' --> 'data\processed_data\GOOGL\4_2023-04-04.md'
Converted 'data\edgar_documents\GOOGL\4_2023-04-13' --> 'data\processed_data\GOOGL\4_2023-04-13.md'


2025-11-14 16:46:20,050 - INFO - Processing document 4_2023-04-27
2025-11-14 16:46:20,102 - INFO - Finished converting document 4_2023-04-27 in 0.08 sec.
2025-11-14 16:46:20,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,240 - INFO - Going to convert document batch...
2025-11-14 16:46:20,241 - INFO - Processing document 4_2023-05-02
2025-11-14 16:46:20,282 - INFO - Finished converting document 4_2023-05-02 in 0.11 sec.
2025-11-14 16:46:20,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,353 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2023-04-27' --> 'data\processed_data\GOOGL\4_2023-04-27.md'
Converted 'data\edgar_documents\GOOGL\4_2023-05-02' --> 'data\processed_data\GOOGL\4_2023-05-02.md'


2025-11-14 16:46:20,354 - INFO - Processing document 4_2023-05-03
2025-11-14 16:46:20,386 - INFO - Finished converting document 4_2023-05-03 in 0.06 sec.
2025-11-14 16:46:20,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,450 - INFO - Going to convert document batch...
2025-11-14 16:46:20,451 - INFO - Processing document 4_2023-05-05
2025-11-14 16:46:20,489 - INFO - Finished converting document 4_2023-05-05 in 0.06 sec.
2025-11-14 16:46:20,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,553 - INFO - Going to convert document batch...
2025-11-14 16:46:20,553 - INFO - Processing document 4_2023-05-09
2025-11-14 16:46:20,593 - INFO - Finished converting document 4_2023-05-09 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-05-03' --> 'data\processed_data\GOOGL\4_2023-05-03.md'
Converted 'data\edgar_documents\GOOGL\4_2023-05-05' --> 'data\processed_data\GOOGL\4_2023-05-05.md'


2025-11-14 16:46:20,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,710 - INFO - Going to convert document batch...
2025-11-14 16:46:20,710 - INFO - Processing document 4_2023-05-10


Converted 'data\edgar_documents\GOOGL\4_2023-05-09' --> 'data\processed_data\GOOGL\4_2023-05-09.md'


2025-11-14 16:46:20,875 - INFO - Finished converting document 4_2023-05-10 in 0.23 sec.
2025-11-14 16:46:20,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:20,970 - INFO - Going to convert document batch...
2025-11-14 16:46:20,971 - INFO - Processing document 4_2023-05-12
2025-11-14 16:46:21,043 - INFO - Finished converting document 4_2023-05-12 in 0.11 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-05-10' --> 'data\processed_data\GOOGL\4_2023-05-10.md'
Converted 'data\edgar_documents\GOOGL\4_2023-05-12' --> 'data\processed_data\GOOGL\4_2023-05-12.md'


2025-11-14 16:46:21,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:21,185 - INFO - Going to convert document batch...
2025-11-14 16:46:21,187 - INFO - Processing document 4_2023-05-15
2025-11-14 16:46:21,238 - INFO - Finished converting document 4_2023-05-15 in 0.11 sec.
2025-11-14 16:46:21,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-05-15' --> 'data\processed_data\GOOGL\4_2023-05-15.md'


2025-11-14 16:46:21,975 - INFO - Going to convert document batch...
2025-11-14 16:46:21,976 - INFO - Processing document 4_2023-05-16
2025-11-14 16:46:22,064 - INFO - Finished converting document 4_2023-05-16 in 0.78 sec.
2025-11-14 16:46:22,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:22,215 - INFO - Going to convert document batch...
2025-11-14 16:46:22,218 - INFO - Processing document 4_2023-05-18
2025-11-14 16:46:22,301 - INFO - Finished converting document 4_2023-05-18 in 0.17 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-05-16' --> 'data\processed_data\GOOGL\4_2023-05-16.md'


2025-11-14 16:46:22,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:22,435 - INFO - Going to convert document batch...
2025-11-14 16:46:22,436 - INFO - Processing document 4_2023-05-22
2025-11-14 16:46:22,513 - INFO - Finished converting document 4_2023-05-22 in 0.16 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-05-18' --> 'data\processed_data\GOOGL\4_2023-05-18.md'


2025-11-14 16:46:22,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:22,615 - INFO - Going to convert document batch...
2025-11-14 16:46:22,616 - INFO - Processing document 4_2023-05-24
2025-11-14 16:46:22,694 - INFO - Finished converting document 4_2023-05-24 in 0.12 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-05-22' --> 'data\processed_data\GOOGL\4_2023-05-22.md'
Converted 'data\edgar_documents\GOOGL\4_2023-05-24' --> 'data\processed_data\GOOGL\4_2023-05-24.md'


2025-11-14 16:46:22,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:22,830 - INFO - Going to convert document batch...
2025-11-14 16:46:22,830 - INFO - Processing document 4_2023-05-26
2025-11-14 16:46:22,870 - INFO - Finished converting document 4_2023-05-26 in 0.12 sec.
2025-11-14 16:46:22,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:22,983 - INFO - Going to convert document batch...
2025-11-14 16:46:22,984 - INFO - Processing document 4_2023-05-31
2025-11-14 16:46:23,014 - INFO - Finished converting document 4_2023-05-31 in 0.11 sec.
2025-11-14 16:46:23,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,083 - INFO - Going to convert document batch...
2025-11-14 16:46:23,083 - INFO - Processing document 4_2023-06-02


Converted 'data\edgar_documents\GOOGL\4_2023-05-26' --> 'data\processed_data\GOOGL\4_2023-05-26.md'
Converted 'data\edgar_documents\GOOGL\4_2023-05-31' --> 'data\processed_data\GOOGL\4_2023-05-31.md'


2025-11-14 16:46:23,112 - INFO - Finished converting document 4_2023-06-02 in 0.06 sec.
2025-11-14 16:46:23,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,302 - INFO - Going to convert document batch...
2025-11-14 16:46:23,303 - INFO - Processing document 4_2023-06-07
2025-11-14 16:46:23,325 - INFO - Finished converting document 4_2023-06-07 in 0.08 sec.
2025-11-14 16:46:23,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,398 - INFO - Going to convert document batch...
2025-11-14 16:46:23,399 - INFO - Processing document 4_2023-06-09


Converted 'data\edgar_documents\GOOGL\4_2023-06-02' --> 'data\processed_data\GOOGL\4_2023-06-02.md'
Converted 'data\edgar_documents\GOOGL\4_2023-06-07' --> 'data\processed_data\GOOGL\4_2023-06-07.md'


2025-11-14 16:46:23,466 - INFO - Finished converting document 4_2023-06-09 in 0.11 sec.
2025-11-14 16:46:23,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,606 - INFO - Going to convert document batch...
2025-11-14 16:46:23,608 - INFO - Processing document 4_2023-06-13
2025-11-14 16:46:23,637 - INFO - Finished converting document 4_2023-06-13 in 0.11 sec.
2025-11-14 16:46:23,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,709 - INFO - Going to convert document batch...
2025-11-14 16:46:23,710 - INFO - Processing document 4_2023-06-15


Converted 'data\edgar_documents\GOOGL\4_2023-06-09' --> 'data\processed_data\GOOGL\4_2023-06-09.md'
Converted 'data\edgar_documents\GOOGL\4_2023-06-13' --> 'data\processed_data\GOOGL\4_2023-06-13.md'


2025-11-14 16:46:23,791 - INFO - Finished converting document 4_2023-06-15 in 0.12 sec.
2025-11-14 16:46:23,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:23,932 - INFO - Going to convert document batch...
2025-11-14 16:46:23,932 - INFO - Processing document 4_2023-06-20
2025-11-14 16:46:24,003 - INFO - Finished converting document 4_2023-06-20 in 0.14 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-06-15' --> 'data\processed_data\GOOGL\4_2023-06-15.md'
Converted 'data\edgar_documents\GOOGL\4_2023-06-20' --> 'data\processed_data\GOOGL\4_2023-06-20.md'


2025-11-14 16:46:24,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:24,095 - INFO - Going to convert document batch...
2025-11-14 16:46:24,095 - INFO - Processing document 4_2023-06-22
2025-11-14 16:46:24,175 - INFO - Finished converting document 4_2023-06-22 in 0.11 sec.
2025-11-14 16:46:24,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:24,301 - INFO - Going to convert document batch...
2025-11-14 16:46:24,302 - INFO - Processing document 4_2023-06-27
2025-11-14 16:46:24,351 - INFO - Finished converting document 4_2023-06-27 in 0.12 sec.
2025-11-14 16:46:24,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-06-22' --> 'data\processed_data\GOOGL\4_2023-06-22.md'
Converted 'data\edgar_documents\GOOGL\4_2023-06-27' --> 'data\processed_data\GOOGL\4_2023-06-27.md'


2025-11-14 16:46:24,457 - INFO - Going to convert document batch...
2025-11-14 16:46:24,458 - INFO - Processing document 4_2023-06-28
2025-11-14 16:46:24,525 - INFO - Finished converting document 4_2023-06-28 in 0.14 sec.
2025-11-14 16:46:24,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:24,624 - INFO - Going to convert document batch...
2025-11-14 16:46:24,625 - INFO - Processing document 4_2023-06-29
2025-11-14 16:46:24,652 - INFO - Finished converting document 4_2023-06-29 in 0.09 sec.
2025-11-14 16:46:24,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:24,705 - INFO - Going to convert document batch...
2025-11-14 16:46:24,706 - INFO - Processing document 4_2023-07-05
2025-11-14 16:46:24,732 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-06-28' --> 'data\processed_data\GOOGL\4_2023-06-28.md'
Converted 'data\edgar_documents\GOOGL\4_2023-06-29' --> 'data\processed_data\GOOGL\4_2023-06-29.md'


2025-11-14 16:46:24,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:24,802 - INFO - Going to convert document batch...
2025-11-14 16:46:24,837 - INFO - Processing document 4_2023-07-06
2025-11-14 16:46:24,940 - INFO - Finished converting document 4_2023-07-06 in 0.17 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-07-05' --> 'data\processed_data\GOOGL\4_2023-07-05.md'


2025-11-14 16:46:25,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,035 - INFO - Going to convert document batch...
2025-11-14 16:46:25,036 - INFO - Processing document 4_2023-07-13
2025-11-14 16:46:25,066 - INFO - Finished converting document 4_2023-07-13 in 0.09 sec.
2025-11-14 16:46:25,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,157 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2023-07-06' --> 'data\processed_data\GOOGL\4_2023-07-06.md'
Converted 'data\edgar_documents\GOOGL\4_2023-07-13' --> 'data\processed_data\GOOGL\4_2023-07-13.md'


2025-11-14 16:46:25,159 - INFO - Processing document 4_2023-07-14
2025-11-14 16:46:25,306 - INFO - Finished converting document 4_2023-07-14 in 0.19 sec.
2025-11-14 16:46:25,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,423 - INFO - Going to convert document batch...
2025-11-14 16:46:25,425 - INFO - Processing document 4_2023-07-27
2025-11-14 16:46:25,454 - INFO - Finished converting document 4_2023-07-27 in 0.11 sec.
2025-11-14 16:46:25,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,512 - INFO - Going to convert document batch...
2025-11-14 16:46:25,513 - INFO - Processing document 4_2023-07-28
2025-11-14 16:46:25,537 - INFO - Finished converting document 4_2023-07-28 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-07-14' --> 'data\processed_data\GOOGL\4_2023-07-14.md'
Converted 'data\edgar_documents\GOOGL\4_2023-07-27' --> 'data\processed_data\GOOGL\4_2023-07-27.md'


2025-11-14 16:46:25,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,588 - INFO - Going to convert document batch...
2025-11-14 16:46:25,589 - INFO - Processing document 4_2023-08-10
2025-11-14 16:46:25,623 - INFO - Finished converting document 4_2023-08-10 in 0.06 sec.
2025-11-14 16:46:25,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,703 - INFO - Going to convert document batch...
2025-11-14 16:46:25,703 - INFO - Processing document 4_2023-08-21
2025-11-14 16:46:25,775 - INFO - Finished converting document 4_2023-08-21 in 0.11 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-07-28' --> 'data\processed_data\GOOGL\4_2023-07-28.md'
Converted 'data\edgar_documents\GOOGL\4_2023-08-10' --> 'data\processed_data\GOOGL\4_2023-08-10.md'


2025-11-14 16:46:25,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,868 - INFO - Going to convert document batch...
2025-11-14 16:46:25,868 - INFO - Processing document 4_2023-08-29
2025-11-14 16:46:25,915 - INFO - Finished converting document 4_2023-08-29 in 0.06 sec.
2025-11-14 16:46:25,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:25,985 - INFO - Going to convert document batch...
2025-11-14 16:46:25,986 - INFO - Processing document 4_2023-09-01
2025-11-14 16:46:26,021 - INFO - Finished converting document 4_2023-09-01 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-08-21' --> 'data\processed_data\GOOGL\4_2023-08-21.md'
Converted 'data\edgar_documents\GOOGL\4_2023-08-29' --> 'data\processed_data\GOOGL\4_2023-08-29.md'
Converted 'data\edgar_documents\GOOGL\4_2023-09-01' --> 'data\processed_data\GOOGL\4_2023-09-01.md'


2025-11-14 16:46:26,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:26,071 - INFO - Going to convert document batch...
2025-11-14 16:46:26,071 - INFO - Processing document 4_2023-09-05
2025-11-14 16:46:26,100 - INFO - Finished converting document 4_2023-09-05 in 0.05 sec.
2025-11-14 16:46:26,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:26,157 - INFO - Going to convert document batch...
2025-11-14 16:46:26,158 - INFO - Processing document 4_2023-09-07


Converted 'data\edgar_documents\GOOGL\4_2023-09-05' --> 'data\processed_data\GOOGL\4_2023-09-05.md'


2025-11-14 16:46:26,458 - INFO - Finished converting document 4_2023-09-07 in 0.33 sec.
2025-11-14 16:46:26,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:26,540 - INFO - Going to convert document batch...
2025-11-14 16:46:26,541 - INFO - Processing document 4_2023-09-11
2025-11-14 16:46:26,568 - INFO - Finished converting document 4_2023-09-11 in 0.08 sec.
2025-11-14 16:46:26,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:26,639 - INFO - Going to convert document batch...
2025-11-14 16:46:26,639 - INFO - Processing document 4_2023-09-26
2025-11-14 16:46:26,677 - INFO - Finished converting document 4_2023-09-26 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-09-07' --> 'data\processed_data\GOOGL\4_2023-09-07.md'
Converted 'data\edgar_documents\GOOGL\4_2023-09-11' --> 'data\processed_data\GOOGL\4_2023-09-11.md'


2025-11-14 16:46:26,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:26,771 - INFO - Going to convert document batch...
2025-11-14 16:46:26,772 - INFO - Processing document 4_2023-09-27
2025-11-14 16:46:26,811 - INFO - Finished converting document 4_2023-09-27 in 0.11 sec.
2025-11-14 16:46:26,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-09-26' --> 'data\processed_data\GOOGL\4_2023-09-26.md'
Converted 'data\edgar_documents\GOOGL\4_2023-09-27' --> 'data\processed_data\GOOGL\4_2023-09-27.md'


2025-11-14 16:46:26,923 - INFO - Going to convert document batch...
2025-11-14 16:46:26,924 - INFO - Processing document 4_2023-09-28
2025-11-14 16:46:26,982 - INFO - Finished converting document 4_2023-09-28 in 0.14 sec.
2025-11-14 16:46:27,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,035 - INFO - Going to convert document batch...
2025-11-14 16:46:27,036 - INFO - Processing document 4_2023-10-02
2025-11-14 16:46:27,058 - INFO - Finished converting document 4_2023-10-02 in 0.05 sec.
2025-11-14 16:46:27,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,120 - INFO - Going to convert document batch...
2025-11-14 16:46:27,120 - INFO - Processing document 4_2023-10-04
2025-11-14 16:46:27,155 - INFO - Finished converting document 4_2023-10-04 in 0.08 sec.
2025-11-14 16:46:27,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-09-28' --> 'data\processed_data\GOOGL\4_2023-09-28.md'
Converted 'data\edgar_documents\GOOGL\4_2023-10-02' --> 'data\processed_data\GOOGL\4_2023-10-02.md'
Converted 'data\edgar_documents\GOOGL\4_2023-10-04' --> 'data\processed_data\GOOGL\4_2023-10-04.md'


2025-11-14 16:46:27,214 - INFO - Going to convert document batch...
2025-11-14 16:46:27,214 - INFO - Processing document 4_2023-10-10
2025-11-14 16:46:27,247 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.
2025-11-14 16:46:27,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,309 - INFO - Going to convert document batch...
2025-11-14 16:46:27,310 - INFO - Processing document 4_2023-10-26
2025-11-14 16:46:27,342 - INFO - Finished converting document 4_2023-10-26 in 0.06 sec.
2025-11-14 16:46:27,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,400 - INFO - Going to convert document batch...
2025-11-14 16:46:27,402 - INFO - Processing document 4_2023-10-27
2025-11-14 16:46:27,430 - INFO - Finished converting document 4_2023-10-27 in 0.05 sec.
2025-11-14 16:46:27,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2023-10-10' --> 'data\processed_data\GOOGL\4_2023-10-10.md'
Converted 'data\edgar_documents\GOOGL\4_2023-10-26' --> 'data\processed_data\GOOGL\4_2023-10-26.md'
Converted 'data\edgar_documents\GOOGL\4_2023-10-27' --> 'data\processed_data\GOOGL\4_2023-10-27.md'


2025-11-14 16:46:27,477 - INFO - Going to convert document batch...
2025-11-14 16:46:27,478 - INFO - Processing document 4_2023-10-30
2025-11-14 16:46:27,510 - INFO - Finished converting document 4_2023-10-30 in 0.06 sec.
2025-11-14 16:46:27,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,565 - INFO - Going to convert document batch...
2025-11-14 16:46:27,566 - INFO - Processing document 4_2023-11-03
2025-11-14 16:46:27,588 - INFO - Finished converting document 4_2023-11-03 in 0.05 sec.
2025-11-14 16:46:27,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,649 - INFO - Going to convert document batch...
2025-11-14 16:46:27,650 - INFO - Processing document 4_2023-11-09
2025-11-14 16:46:27,708 - INFO - Finished converting document 4_2023-11-09 in 0.09 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-10-30' --> 'data\processed_data\GOOGL\4_2023-10-30.md'
Converted 'data\edgar_documents\GOOGL\4_2023-11-03' --> 'data\processed_data\GOOGL\4_2023-11-03.md'
Converted 'data\edgar_documents\GOOGL\4_2023-11-09' --> 'data\processed_data\GOOGL\4_2023-11-09.md'


2025-11-14 16:46:27,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:27,821 - INFO - Going to convert document batch...
2025-11-14 16:46:27,822 - INFO - Processing document 4_2023-11-14
2025-11-14 16:46:27,959 - INFO - Finished converting document 4_2023-11-14 in 0.20 sec.
2025-11-14 16:46:28,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,073 - INFO - Going to convert document batch...
2025-11-14 16:46:28,073 - INFO - Processing document 4_2023-11-28
2025-11-14 16:46:28,109 - INFO - Finished converting document 4_2023-11-28 in 0.11 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-11-14' --> 'data\processed_data\GOOGL\4_2023-11-14.md'
Converted 'data\edgar_documents\GOOGL\4_2023-11-28' --> 'data\processed_data\GOOGL\4_2023-11-28.md'


2025-11-14 16:46:28,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,234 - INFO - Going to convert document batch...
2025-11-14 16:46:28,235 - INFO - Processing document 4_2023-11-29
2025-11-14 16:46:28,261 - INFO - Finished converting document 4_2023-11-29 in 0.12 sec.
2025-11-14 16:46:28,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,363 - INFO - Going to convert document batch...
2025-11-14 16:46:28,363 - INFO - Processing document 4_2023-11-30
2025-11-14 16:46:28,391 - INFO - Finished converting document 4_2023-11-30 in 0.09 sec.
2025-11-14 16:46:28,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,472 - INFO - Going to convert document batch...
2025-11-14 16:46:28,473 - INFO - Processing document 4_2023-12-01
2025-11-14 16:46:28,499 - INFO - Finished converting document 4_2023-12-01 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-11-29' --> 'data\processed_data\GOOGL\4_2023-11-29.md'
Converted 'data\edgar_documents\GOOGL\4_2023-11-30' --> 'data\processed_data\GOOGL\4_2023-11-30.md'


2025-11-14 16:46:28,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,550 - INFO - Going to convert document batch...
2025-11-14 16:46:28,551 - INFO - Processing document 4_2023-12-08
2025-11-14 16:46:28,580 - INFO - Finished converting document 4_2023-12-08 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-12-01' --> 'data\processed_data\GOOGL\4_2023-12-01.md'
Converted 'data\edgar_documents\GOOGL\4_2023-12-08' --> 'data\processed_data\GOOGL\4_2023-12-08.md'


2025-11-14 16:46:28,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,769 - INFO - Going to convert document batch...
2025-11-14 16:46:28,769 - INFO - Processing document 4_2023-12-11
2025-11-14 16:46:28,796 - INFO - Finished converting document 4_2023-12-11 in 0.09 sec.
2025-11-14 16:46:28,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,856 - INFO - Going to convert document batch...
2025-11-14 16:46:28,857 - INFO - Processing document 4_2023-12-21
2025-11-14 16:46:28,888 - INFO - Finished converting document 4_2023-12-21 in 0.06 sec.
2025-11-14 16:46:28,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:28,948 - INFO - Going to convert document batch...
2025-11-14 16:46:28,949 - INFO - Processing document 4_2023-12-27
2025-11-14 16:46:28,982 - INFO - Finished converting document 4_2023-12-27 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-12-11' --> 'data\processed_data\GOOGL\4_2023-12-11.md'
Converted 'data\edgar_documents\GOOGL\4_2023-12-21' --> 'data\processed_data\GOOGL\4_2023-12-21.md'
Converted 'data\edgar_documents\GOOGL\4_2023-12-27' --> 'data\processed_data\GOOGL\4_2023-12-27.md'


2025-11-14 16:46:29,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,050 - INFO - Going to convert document batch...
2025-11-14 16:46:29,051 - INFO - Processing document 4_2023-12-29
2025-11-14 16:46:29,080 - INFO - Finished converting document 4_2023-12-29 in 0.06 sec.
2025-11-14 16:46:29,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,245 - INFO - Going to convert document batch...
2025-11-14 16:46:29,247 - INFO - Processing document 4_2024-01-02
2025-11-14 16:46:29,269 - INFO - Finished converting document 4_2024-01-02 in 0.05 sec.
2025-11-14 16:46:29,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,326 - INFO - Going to convert document batch...
2025-11-14 16:46:29,327 - INFO - Processing document 4_2024-01-03
2025-11-14 16:46:29,362 - INFO - Finished converting document 4_2024-01-03 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2023-12-29' --> 'data\processed_data\GOOGL\4_2023-12-29.md'
Converted 'data\edgar_documents\GOOGL\4_2024-01-02' --> 'data\processed_data\GOOGL\4_2024-01-02.md'


2025-11-14 16:46:29,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,421 - INFO - Going to convert document batch...
2025-11-14 16:46:29,422 - INFO - Processing document 4_2024-01-04
2025-11-14 16:46:29,465 - INFO - Finished converting document 4_2024-01-04 in 0.08 sec.
2025-11-14 16:46:29,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,547 - INFO - Going to convert document batch...
2025-11-14 16:46:29,548 - INFO - Processing document 4_2024-01-10
2025-11-14 16:46:29,574 - INFO - Finished converting document 4_2024-01-10 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-01-03' --> 'data\processed_data\GOOGL\4_2024-01-03.md'
Converted 'data\edgar_documents\GOOGL\4_2024-01-04' --> 'data\processed_data\GOOGL\4_2024-01-04.md'


2025-11-14 16:46:29,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,648 - INFO - Going to convert document batch...
2025-11-14 16:46:29,650 - INFO - Processing document 4_2024-01-12
2025-11-14 16:46:29,689 - INFO - Finished converting document 4_2024-01-12 in 0.09 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-01-10' --> 'data\processed_data\GOOGL\4_2024-01-10.md'
Converted 'data\edgar_documents\GOOGL\4_2024-01-12' --> 'data\processed_data\GOOGL\4_2024-01-12.md'


2025-11-14 16:46:29,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,879 - INFO - Going to convert document batch...
2025-11-14 16:46:29,880 - INFO - Processing document 4_2024-01-17
2025-11-14 16:46:29,912 - INFO - Finished converting document 4_2024-01-17 in 0.17 sec.
2025-11-14 16:46:29,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:29,969 - INFO - Going to convert document batch...
2025-11-14 16:46:29,970 - INFO - Processing document 4_2024-01-26
2025-11-14 16:46:30,003 - INFO - Finished converting document 4_2024-01-26 in 0.06 sec.
2025-11-14 16:46:30,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,050 - INFO - Going to convert document batch...
2025-11-14 16:46:30,050 - INFO - Processing document 4_2024-01-30
2025-11-14 16:46:30,076 - INFO - Finished converting document 4_2024-01-30 in 0.05 sec.
2025-11-14 16:46:30,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\4_2024-01-17' --> 'data\processed_data\GOOGL\4_2024-01-17.md'
Converted 'data\edgar_documents\GOOGL\4_2024-01-26' --> 'data\processed_data\GOOGL\4_2024-01-26.md'
Converted 'data\edgar_documents\GOOGL\4_2024-01-30' --> 'data\processed_data\GOOGL\4_2024-01-30.md'


2025-11-14 16:46:30,124 - INFO - Processing document 4_2024-02-01
2025-11-14 16:46:30,150 - INFO - Finished converting document 4_2024-02-01 in 0.06 sec.
2025-11-14 16:46:30,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,202 - INFO - Going to convert document batch...
2025-11-14 16:46:30,232 - INFO - Processing document 4_2024-02-08
2025-11-14 16:46:30,306 - INFO - Finished converting document 4_2024-02-08 in 0.12 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-02-01' --> 'data\processed_data\GOOGL\4_2024-02-01.md'
Converted 'data\edgar_documents\GOOGL\4_2024-02-08' --> 'data\processed_data\GOOGL\4_2024-02-08.md'


2025-11-14 16:46:30,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,461 - INFO - Going to convert document batch...
2025-11-14 16:46:30,462 - INFO - Processing document 4_2024-02-09
2025-11-14 16:46:30,501 - INFO - Finished converting document 4_2024-02-09 in 0.17 sec.
2025-11-14 16:46:30,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,604 - INFO - Going to convert document batch...
2025-11-14 16:46:30,605 - INFO - Processing document 4_2024-02-13
2025-11-14 16:46:30,648 - INFO - Finished converting document 4_2024-02-13 in 0.11 sec.
2025-11-14 16:46:30,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,700 - INFO - Going to convert document batch...
2025-11-14 16:46:30,701 - INFO - Processing document 4_2024-02-22
2025-11-14 16:46:30,720 - INFO - Finished converting document 4_2024-02-22 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-02-09' --> 'data\processed_data\GOOGL\4_2024-02-09.md'
Converted 'data\edgar_documents\GOOGL\4_2024-02-13' --> 'data\processed_data\GOOGL\4_2024-02-13.md'


2025-11-14 16:46:30,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:30,768 - INFO - Going to convert document batch...
2025-11-14 16:46:30,769 - INFO - Processing document 4_2024-02-23
2025-11-14 16:46:30,800 - INFO - Finished converting document 4_2024-02-23 in 0.05 sec.
2025-11-14 16:46:30,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-02-22' --> 'data\processed_data\GOOGL\4_2024-02-22.md'
Converted 'data\edgar_documents\GOOGL\4_2024-02-23' --> 'data\processed_data\GOOGL\4_2024-02-23.md'


2025-11-14 16:46:30,969 - INFO - Going to convert document batch...
2025-11-14 16:46:30,970 - INFO - Processing document 4_2024-02-27
2025-11-14 16:46:30,999 - INFO - Finished converting document 4_2024-02-27 in 0.08 sec.
2025-11-14 16:46:31,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:31,073 - INFO - Going to convert document batch...
2025-11-14 16:46:31,074 - INFO - Processing document 4_2024-02-29
2025-11-14 16:46:31,097 - INFO - Finished converting document 4_2024-02-29 in 0.06 sec.
2025-11-14 16:46:31,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:31,149 - INFO - Going to convert document batch...
2025-11-14 16:46:31,149 - INFO - Processing document 4_2024-03-04
2025-11-14 16:46:31,169 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.
2025-11-14 16:46:31,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-02-27' --> 'data\processed_data\GOOGL\4_2024-02-27.md'
Converted 'data\edgar_documents\GOOGL\4_2024-02-29' --> 'data\processed_data\GOOGL\4_2024-02-29.md'
Converted 'data\edgar_documents\GOOGL\4_2024-03-04' --> 'data\processed_data\GOOGL\4_2024-03-04.md'


2025-11-14 16:46:31,234 - INFO - Going to convert document batch...
2025-11-14 16:46:31,235 - INFO - Processing document 4_2024-03-06
2025-11-14 16:46:31,266 - INFO - Finished converting document 4_2024-03-06 in 0.08 sec.
2025-11-14 16:46:31,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:31,321 - INFO - Going to convert document batch...
2025-11-14 16:46:31,322 - INFO - Processing document 4_2024-03-08
2025-11-14 16:46:31,353 - INFO - Finished converting document 4_2024-03-08 in 0.05 sec.
2025-11-14 16:46:31,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:31,406 - INFO - Going to convert document batch...
2025-11-14 16:46:31,407 - INFO - Processing document 4_2024-03-12
2025-11-14 16:46:31,435 - INFO - Finished converting document 4_2024-03-12 in 0.06 sec.
2025-11-14 16:46:31,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-03-06' --> 'data\processed_data\GOOGL\4_2024-03-06.md'
Converted 'data\edgar_documents\GOOGL\4_2024-03-08' --> 'data\processed_data\GOOGL\4_2024-03-08.md'
Converted 'data\edgar_documents\GOOGL\4_2024-03-12' --> 'data\processed_data\GOOGL\4_2024-03-12.md'


2025-11-14 16:46:31,869 - INFO - Going to convert document batch...
2025-11-14 16:46:31,870 - INFO - Processing document 4_2024-03-19
2025-11-14 16:46:31,901 - INFO - Finished converting document 4_2024-03-19 in 0.44 sec.
2025-11-14 16:46:31,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:31,958 - INFO - Going to convert document batch...
2025-11-14 16:46:31,959 - INFO - Processing document 4_2024-03-20
2025-11-14 16:46:31,983 - INFO - Finished converting document 4_2024-03-20 in 0.05 sec.
2025-11-14 16:46:32,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,046 - INFO - Going to convert document batch...
2025-11-14 16:46:32,047 - INFO - Processing document 4_2024-03-26
2025-11-14 16:46:32,080 - INFO - Finished converting document 4_2024-03-26 in 0.08 sec.
2025-11-14 16:46:32,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-03-19' --> 'data\processed_data\GOOGL\4_2024-03-19.md'
Converted 'data\edgar_documents\GOOGL\4_2024-03-20' --> 'data\processed_data\GOOGL\4_2024-03-20.md'
Converted 'data\edgar_documents\GOOGL\4_2024-03-26' --> 'data\processed_data\GOOGL\4_2024-03-26.md'


2025-11-14 16:46:32,137 - INFO - Going to convert document batch...
2025-11-14 16:46:32,138 - INFO - Processing document 4_2024-03-29
2025-11-14 16:46:32,179 - INFO - Finished converting document 4_2024-03-29 in 0.06 sec.
2025-11-14 16:46:32,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,229 - INFO - Going to convert document batch...
2025-11-14 16:46:32,230 - INFO - Processing document 4_2024-04-02
2025-11-14 16:46:32,256 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 16:46:32,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,316 - INFO - Going to convert document batch...
2025-11-14 16:46:32,317 - INFO - Processing document 4_2024-04-04
2025-11-14 16:46:32,342 - INFO - Finished converting document 4_2024-04-04 in 0.06 sec.
2025-11-14 16:46:32,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-03-29' --> 'data\processed_data\GOOGL\4_2024-03-29.md'
Converted 'data\edgar_documents\GOOGL\4_2024-04-02' --> 'data\processed_data\GOOGL\4_2024-04-02.md'
Converted 'data\edgar_documents\GOOGL\4_2024-04-04' --> 'data\processed_data\GOOGL\4_2024-04-04.md'


2025-11-14 16:46:32,412 - INFO - Going to convert document batch...
2025-11-14 16:46:32,413 - INFO - Processing document 4_2024-04-15
2025-11-14 16:46:32,453 - INFO - Finished converting document 4_2024-04-15 in 0.08 sec.
2025-11-14 16:46:32,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,586 - INFO - Going to convert document batch...
2025-11-14 16:46:32,587 - INFO - Processing document 4_2024-04-17
2025-11-14 16:46:32,618 - INFO - Finished converting document 4_2024-04-17 in 0.11 sec.
2025-11-14 16:46:32,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,692 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2024-04-15' --> 'data\processed_data\GOOGL\4_2024-04-15.md'
Converted 'data\edgar_documents\GOOGL\4_2024-04-17' --> 'data\processed_data\GOOGL\4_2024-04-17.md'


2025-11-14 16:46:32,692 - INFO - Processing document 4_2024-04-26
2025-11-14 16:46:32,729 - INFO - Finished converting document 4_2024-04-26 in 0.08 sec.
2025-11-14 16:46:32,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,793 - INFO - Going to convert document batch...
2025-11-14 16:46:32,794 - INFO - Processing document 4_2024-04-30
2025-11-14 16:46:32,823 - INFO - Finished converting document 4_2024-04-30 in 0.06 sec.
2025-11-14 16:46:32,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,875 - INFO - Going to convert document batch...
2025-11-14 16:46:32,875 - INFO - Processing document 4_2024-05-01
2025-11-14 16:46:32,902 - INFO - Finished converting document 4_2024-05-01 in 0.06 sec.
2025-11-14 16:46:32,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:32,948 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2024-04-26' --> 'data\processed_data\GOOGL\4_2024-04-26.md'
Converted 'data\edgar_documents\GOOGL\4_2024-04-30' --> 'data\processed_data\GOOGL\4_2024-04-30.md'
Converted 'data\edgar_documents\GOOGL\4_2024-05-01' --> 'data\processed_data\GOOGL\4_2024-05-01.md'


2025-11-14 16:46:32,949 - INFO - Processing document 4_2024-05-03
2025-11-14 16:46:32,979 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.
2025-11-14 16:46:33,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,035 - INFO - Going to convert document batch...
2025-11-14 16:46:33,036 - INFO - Processing document 4_2024-05-13
2025-11-14 16:46:33,068 - INFO - Finished converting document 4_2024-05-13 in 0.06 sec.
2025-11-14 16:46:33,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,119 - INFO - Going to convert document batch...
2025-11-14 16:46:33,120 - INFO - Processing document 4_2024-05-14
2025-11-14 16:46:33,150 - INFO - Finished converting document 4_2024-05-14 in 0.05 sec.
2025-11-14 16:46:33,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-05-03' --> 'data\processed_data\GOOGL\4_2024-05-03.md'
Converted 'data\edgar_documents\GOOGL\4_2024-05-13' --> 'data\processed_data\GOOGL\4_2024-05-13.md'
Converted 'data\edgar_documents\GOOGL\4_2024-05-14' --> 'data\processed_data\GOOGL\4_2024-05-14.md'


2025-11-14 16:46:33,195 - INFO - Going to convert document batch...
2025-11-14 16:46:33,196 - INFO - Processing document 4_2024-05-15
2025-11-14 16:46:33,225 - INFO - Finished converting document 4_2024-05-15 in 0.05 sec.
2025-11-14 16:46:33,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,396 - INFO - Going to convert document batch...
2025-11-14 16:46:33,396 - INFO - Processing document 4_2024-05-29
2025-11-14 16:46:33,422 - INFO - Finished converting document 4_2024-05-29 in 0.08 sec.
2025-11-14 16:46:33,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,477 - INFO - Going to convert document batch...
2025-11-14 16:46:33,479 - INFO - Processing document 4_2024-06-03
2025-11-14 16:46:33,515 - INFO - Finished converting document 4_2024-06-03 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-05-15' --> 'data\processed_data\GOOGL\4_2024-05-15.md'
Converted 'data\edgar_documents\GOOGL\4_2024-05-29' --> 'data\processed_data\GOOGL\4_2024-05-29.md'
Converted 'data\edgar_documents\GOOGL\4_2024-06-03' --> 'data\processed_data\GOOGL\4_2024-06-03.md'


2025-11-14 16:46:33,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,577 - INFO - Going to convert document batch...
2025-11-14 16:46:33,578 - INFO - Processing document 4_2024-06-05
2025-11-14 16:46:33,618 - INFO - Finished converting document 4_2024-06-05 in 0.08 sec.
2025-11-14 16:46:33,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,710 - INFO - Going to convert document batch...
2025-11-14 16:46:33,711 - INFO - Processing document 4_2024-06-12
2025-11-14 16:46:33,746 - INFO - Finished converting document 4_2024-06-12 in 0.08 sec.
2025-11-14 16:46:33,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:33,798 - INFO - Going to convert document batch...
2025-11-14 16:46:33,799 - INFO - Processing document 4_2024-06-18
2025-11-14 16:46:33,828 - INFO - Finished converting document 4_2024-06-18 in 0.06 sec.
2025-11-14 16:46:33,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-06-05' --> 'data\processed_data\GOOGL\4_2024-06-05.md'
Converted 'data\edgar_documents\GOOGL\4_2024-06-12' --> 'data\processed_data\GOOGL\4_2024-06-12.md'
Converted 'data\edgar_documents\GOOGL\4_2024-06-18' --> 'data\processed_data\GOOGL\4_2024-06-18.md'


2025-11-14 16:46:33,876 - INFO - Going to convert document batch...
2025-11-14 16:46:33,877 - INFO - Processing document 4_2024-06-21
2025-11-14 16:46:33,903 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.
2025-11-14 16:46:34,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,078 - INFO - Going to convert document batch...
2025-11-14 16:46:34,079 - INFO - Processing document 4_2024-06-26
2025-11-14 16:46:34,119 - INFO - Finished converting document 4_2024-06-26 in 0.08 sec.
2025-11-14 16:46:34,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-06-21' --> 'data\processed_data\GOOGL\4_2024-06-21.md'
Converted 'data\edgar_documents\GOOGL\4_2024-06-26' --> 'data\processed_data\GOOGL\4_2024-06-26.md'


2025-11-14 16:46:34,251 - INFO - Going to convert document batch...
2025-11-14 16:46:34,253 - INFO - Processing document 4_2024-06-27
2025-11-14 16:46:34,295 - INFO - Finished converting document 4_2024-06-27 in 0.12 sec.
2025-11-14 16:46:34,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,399 - INFO - Going to convert document batch...
2025-11-14 16:46:34,400 - INFO - Processing document 4_2024-07-02
2025-11-14 16:46:34,422 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.
2025-11-14 16:46:34,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,468 - INFO - Going to convert document batch...
2025-11-14 16:46:34,469 - INFO - Processing document 4_2024-07-03
2025-11-14 16:46:34,492 - INFO - Finished converting document 4_2024-07-03 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-06-27' --> 'data\processed_data\GOOGL\4_2024-06-27.md'
Converted 'data\edgar_documents\GOOGL\4_2024-07-02' --> 'data\processed_data\GOOGL\4_2024-07-02.md'
Converted 'data\edgar_documents\GOOGL\4_2024-07-03' --> 'data\processed_data\GOOGL\4_2024-07-03.md'


2025-11-14 16:46:34,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,547 - INFO - Going to convert document batch...
2025-11-14 16:46:34,548 - INFO - Processing document 4_2024-07-05
2025-11-14 16:46:34,657 - INFO - Finished converting document 4_2024-07-05 in 0.14 sec.
2025-11-14 16:46:34,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,776 - INFO - Going to convert document batch...
2025-11-14 16:46:34,777 - INFO - Processing document 4_2024-07-16
2025-11-14 16:46:34,807 - INFO - Finished converting document 4_2024-07-16 in 0.12 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-07-05' --> 'data\processed_data\GOOGL\4_2024-07-05.md'
Converted 'data\edgar_documents\GOOGL\4_2024-07-16' --> 'data\processed_data\GOOGL\4_2024-07-16.md'


2025-11-14 16:46:34,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:34,921 - INFO - Going to convert document batch...
2025-11-14 16:46:34,922 - INFO - Processing document 4_2024-07-18
2025-11-14 16:46:34,955 - INFO - Finished converting document 4_2024-07-18 in 0.12 sec.
2025-11-14 16:46:35,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,055 - INFO - Going to convert document batch...
2025-11-14 16:46:35,057 - INFO - Processing document 4_2024-07-26
2025-11-14 16:46:35,090 - INFO - Finished converting document 4_2024-07-26 in 0.11 sec.
2025-11-14 16:46:35,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,144 - INFO - Going to convert document batch...
2025-11-14 16:46:35,145 - INFO - Processing document 4_2024-07-30
2025-11-14 16:46:35,186 - INFO - Finished converting document 4_2024-07-30 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-07-18' --> 'data\processed_data\GOOGL\4_2024-07-18.md'
Converted 'data\edgar_documents\GOOGL\4_2024-07-26' --> 'data\processed_data\GOOGL\4_2024-07-26.md'


2025-11-14 16:46:35,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,241 - INFO - Going to convert document batch...
2025-11-14 16:46:35,242 - INFO - Processing document 4_2024-08-02
2025-11-14 16:46:35,277 - INFO - Finished converting document 4_2024-08-02 in 0.06 sec.
2025-11-14 16:46:35,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,327 - INFO - Going to convert document batch...
2025-11-14 16:46:35,328 - INFO - Processing document 4_2024-08-07
2025-11-14 16:46:35,354 - INFO - Finished converting document 4_2024-08-07 in 0.06 sec.
2025-11-14 16:46:35,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-07-30' --> 'data\processed_data\GOOGL\4_2024-07-30.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-02' --> 'data\processed_data\GOOGL\4_2024-08-02.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-07' --> 'data\processed_data\GOOGL\4_2024-08-07.md'


2025-11-14 16:46:35,415 - INFO - Going to convert document batch...
2025-11-14 16:46:35,416 - INFO - Processing document 4_2024-08-09
2025-11-14 16:46:35,442 - INFO - Finished converting document 4_2024-08-09 in 0.05 sec.
2025-11-14 16:46:35,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,495 - INFO - Going to convert document batch...
2025-11-14 16:46:35,496 - INFO - Processing document 4_2024-08-12
2025-11-14 16:46:35,525 - INFO - Finished converting document 4_2024-08-12 in 0.05 sec.
2025-11-14 16:46:35,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,578 - INFO - Going to convert document batch...
2025-11-14 16:46:35,578 - INFO - Processing document 4_2024-08-16
2025-11-14 16:46:35,602 - INFO - Finished converting document 4_2024-08-16 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-08-09' --> 'data\processed_data\GOOGL\4_2024-08-09.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-12' --> 'data\processed_data\GOOGL\4_2024-08-12.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-16' --> 'data\processed_data\GOOGL\4_2024-08-16.md'


2025-11-14 16:46:35,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,673 - INFO - Going to convert document batch...
2025-11-14 16:46:35,675 - INFO - Processing document 4_2024-08-19
2025-11-14 16:46:35,718 - INFO - Finished converting document 4_2024-08-19 in 0.09 sec.
2025-11-14 16:46:35,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,769 - INFO - Going to convert document batch...
2025-11-14 16:46:35,770 - INFO - Processing document 4_2024-08-21
2025-11-14 16:46:35,796 - INFO - Finished converting document 4_2024-08-21 in 0.05 sec.
2025-11-14 16:46:35,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:35,846 - INFO - Going to convert document batch...
2025-11-14 16:46:35,847 - INFO - Processing document 4_2024-08-27
2025-11-14 16:46:35,882 - INFO - Finished converting document 4_2024-08-27 in 0.06 sec.
2025-11-14 16:46:35,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-08-19' --> 'data\processed_data\GOOGL\4_2024-08-19.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-21' --> 'data\processed_data\GOOGL\4_2024-08-21.md'
Converted 'data\edgar_documents\GOOGL\4_2024-08-27' --> 'data\processed_data\GOOGL\4_2024-08-27.md'


2025-11-14 16:46:35,940 - INFO - Going to convert document batch...
2025-11-14 16:46:35,942 - INFO - Processing document 4_2024-09-03
2025-11-14 16:46:35,974 - INFO - Finished converting document 4_2024-09-03 in 0.06 sec.
2025-11-14 16:46:36,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,036 - INFO - Going to convert document batch...
2025-11-14 16:46:36,037 - INFO - Processing document 4_2024-09-05
2025-11-14 16:46:36,070 - INFO - Finished converting document 4_2024-09-05 in 0.06 sec.
2025-11-14 16:46:36,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,122 - INFO - Going to convert document batch...
2025-11-14 16:46:36,123 - INFO - Processing document 4_2024-09-06
2025-11-14 16:46:36,148 - INFO - Finished converting document 4_2024-09-06 in 0.05 sec.
2025-11-14 16:46:36,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-09-03' --> 'data\processed_data\GOOGL\4_2024-09-03.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-05' --> 'data\processed_data\GOOGL\4_2024-09-05.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-06' --> 'data\processed_data\GOOGL\4_2024-09-06.md'


2025-11-14 16:46:36,198 - INFO - Going to convert document batch...
2025-11-14 16:46:36,200 - INFO - Processing document 4_2024-09-10
2025-11-14 16:46:36,224 - INFO - Finished converting document 4_2024-09-10 in 0.05 sec.
2025-11-14 16:46:36,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,285 - INFO - Going to convert document batch...
2025-11-14 16:46:36,286 - INFO - Processing document 4_2024-09-16
2025-11-14 16:46:36,314 - INFO - Finished converting document 4_2024-09-16 in 0.06 sec.
2025-11-14 16:46:36,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,368 - INFO - Going to convert document batch...
2025-11-14 16:46:36,368 - INFO - Processing document 4_2024-09-17
2025-11-14 16:46:36,395 - INFO - Finished converting document 4_2024-09-17 in 0.05 sec.
2025-11-14 16:46:36,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-09-10' --> 'data\processed_data\GOOGL\4_2024-09-10.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-16' --> 'data\processed_data\GOOGL\4_2024-09-16.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-17' --> 'data\processed_data\GOOGL\4_2024-09-17.md'


2025-11-14 16:46:36,460 - INFO - Going to convert document batch...
2025-11-14 16:46:36,461 - INFO - Processing document 4_2024-09-18
2025-11-14 16:46:36,850 - INFO - Finished converting document 4_2024-09-18 in 0.42 sec.
2025-11-14 16:46:36,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,917 - INFO - Going to convert document batch...
2025-11-14 16:46:36,919 - INFO - Processing document 4_2024-09-24
2025-11-14 16:46:36,944 - INFO - Finished converting document 4_2024-09-24 in 0.05 sec.
2025-11-14 16:46:36,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:36,997 - INFO - Going to convert document batch...
2025-11-14 16:46:36,998 - INFO - Processing document 4_2024-09-26
2025-11-14 16:46:37,034 - INFO - Finished converting document 4_2024-09-26 in 0.06 sec.
2025-11-14 16:46:37,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-09-18' --> 'data\processed_data\GOOGL\4_2024-09-18.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-24' --> 'data\processed_data\GOOGL\4_2024-09-24.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-26' --> 'data\processed_data\GOOGL\4_2024-09-26.md'


2025-11-14 16:46:37,091 - INFO - Going to convert document batch...
2025-11-14 16:46:37,092 - INFO - Processing document 4_2024-09-27
2025-11-14 16:46:37,135 - INFO - Finished converting document 4_2024-09-27 in 0.08 sec.
2025-11-14 16:46:37,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,233 - INFO - Going to convert document batch...
2025-11-14 16:46:37,233 - INFO - Processing document 4_2024-09-30
2025-11-14 16:46:37,264 - INFO - Finished converting document 4_2024-09-30 in 0.09 sec.
2025-11-14 16:46:37,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,315 - INFO - Going to convert document batch...
2025-11-14 16:46:37,316 - INFO - Processing document 4_2024-10-02
2025-11-14 16:46:37,346 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-09-27' --> 'data\processed_data\GOOGL\4_2024-09-27.md'
Converted 'data\edgar_documents\GOOGL\4_2024-09-30' --> 'data\processed_data\GOOGL\4_2024-09-30.md'
Converted 'data\edgar_documents\GOOGL\4_2024-10-02' --> 'data\processed_data\GOOGL\4_2024-10-02.md'


2025-11-14 16:46:37,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,423 - INFO - Going to convert document batch...
2025-11-14 16:46:37,452 - INFO - Processing document 4_2024-10-15
2025-11-14 16:46:37,553 - INFO - Finished converting document 4_2024-10-15 in 0.17 sec.
2025-11-14 16:46:37,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,661 - INFO - Going to convert document batch...
2025-11-14 16:46:37,663 - INFO - Processing document 4_2024-10-16
2025-11-14 16:46:37,702 - INFO - Finished converting document 4_2024-10-16 in 0.11 sec.
2025-11-14 16:46:37,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,758 - INFO - Going to convert document batch...
2025-11-14 16:46:37,759 - INFO - Processing document 4_2024-10-28
2025-11-14 16:46:37,782 - INFO - Finished converting document 4_2024-10-28 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-10-15' --> 'data\processed_data\GOOGL\4_2024-10-15.md'
Converted 'data\edgar_documents\GOOGL\4_2024-10-16' --> 'data\processed_data\GOOGL\4_2024-10-16.md'


2025-11-14 16:46:37,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,840 - INFO - Going to convert document batch...
2025-11-14 16:46:37,841 - INFO - Processing document 4_2024-11-01
2025-11-14 16:46:37,887 - INFO - Finished converting document 4_2024-11-01 in 0.09 sec.
2025-11-14 16:46:37,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:37,953 - INFO - Going to convert document batch...
2025-11-14 16:46:37,954 - INFO - Processing document 4_2024-11-04
2025-11-14 16:46:37,977 - INFO - Finished converting document 4_2024-11-04 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-10-28' --> 'data\processed_data\GOOGL\4_2024-10-28.md'
Converted 'data\edgar_documents\GOOGL\4_2024-11-01' --> 'data\processed_data\GOOGL\4_2024-11-01.md'


2025-11-14 16:46:38,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,032 - INFO - Going to convert document batch...
2025-11-14 16:46:38,033 - INFO - Processing document 4_2024-11-06
2025-11-14 16:46:38,146 - INFO - Finished converting document 4_2024-11-06 in 0.14 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-11-04' --> 'data\processed_data\GOOGL\4_2024-11-04.md'


2025-11-14 16:46:38,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,228 - INFO - Going to convert document batch...
2025-11-14 16:46:38,230 - INFO - Processing document 4_2024-11-07
2025-11-14 16:46:38,274 - INFO - Finished converting document 4_2024-11-07 in 0.08 sec.
2025-11-14 16:46:38,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,335 - INFO - Going to convert document batch...
2025-11-14 16:46:38,335 - INFO - Processing document 4_2024-11-12
2025-11-14 16:46:38,368 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-11-06' --> 'data\processed_data\GOOGL\4_2024-11-06.md'
Converted 'data\edgar_documents\GOOGL\4_2024-11-07' --> 'data\processed_data\GOOGL\4_2024-11-07.md'


2025-11-14 16:46:38,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,548 - INFO - Going to convert document batch...
2025-11-14 16:46:38,549 - INFO - Processing document 4_2024-11-18
2025-11-14 16:46:38,578 - INFO - Finished converting document 4_2024-11-18 in 0.09 sec.
2025-11-14 16:46:38,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,650 - INFO - Going to convert document batch...
2025-11-14 16:46:38,651 - INFO - Processing document 4_2024-11-21


Converted 'data\edgar_documents\GOOGL\4_2024-11-12' --> 'data\processed_data\GOOGL\4_2024-11-12.md'
Converted 'data\edgar_documents\GOOGL\4_2024-11-18' --> 'data\processed_data\GOOGL\4_2024-11-18.md'


2025-11-14 16:46:38,679 - INFO - Finished converting document 4_2024-11-21 in 0.06 sec.
2025-11-14 16:46:38,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,744 - INFO - Going to convert document batch...
2025-11-14 16:46:38,745 - INFO - Processing document 4_2024-11-26
2025-11-14 16:46:38,779 - INFO - Finished converting document 4_2024-11-26 in 0.06 sec.
2025-11-14 16:46:38,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:38,832 - INFO - Going to convert document batch...
2025-11-14 16:46:38,832 - INFO - Processing document 4_2024-12-02
2025-11-14 16:46:38,859 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 16:46:38,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2024-11-21' --> 'data\processed_data\GOOGL\4_2024-11-21.md'
Converted 'data\edgar_documents\GOOGL\4_2024-11-26' --> 'data\processed_data\GOOGL\4_2024-11-26.md'
Converted 'data\edgar_documents\GOOGL\4_2024-12-02' --> 'data\processed_data\GOOGL\4_2024-12-02.md'


2025-11-14 16:46:38,912 - INFO - Going to convert document batch...
2025-11-14 16:46:38,913 - INFO - Processing document 4_2024-12-04
2025-11-14 16:46:38,943 - INFO - Finished converting document 4_2024-12-04 in 0.05 sec.
2025-11-14 16:46:38,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,003 - INFO - Going to convert document batch...
2025-11-14 16:46:39,004 - INFO - Processing document 4_2024-12-10
2025-11-14 16:46:39,041 - INFO - Finished converting document 4_2024-12-10 in 0.06 sec.
2025-11-14 16:46:39,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,114 - INFO - Going to convert document batch...
2025-11-14 16:46:39,115 - INFO - Processing document 4_2024-12-13
2025-11-14 16:46:39,144 - INFO - Finished converting document 4_2024-12-13 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-12-04' --> 'data\processed_data\GOOGL\4_2024-12-04.md'
Converted 'data\edgar_documents\GOOGL\4_2024-12-10' --> 'data\processed_data\GOOGL\4_2024-12-10.md'
Converted 'data\edgar_documents\GOOGL\4_2024-12-13' --> 'data\processed_data\GOOGL\4_2024-12-13.md'


2025-11-14 16:46:39,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,202 - INFO - Going to convert document batch...
2025-11-14 16:46:39,203 - INFO - Processing document 4_2024-12-17
2025-11-14 16:46:39,259 - INFO - Finished converting document 4_2024-12-17 in 0.08 sec.
2025-11-14 16:46:39,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,366 - INFO - Going to convert document batch...
2025-11-14 16:46:39,367 - INFO - Processing document 4_2024-12-18
2025-11-14 16:46:39,421 - INFO - Finished converting document 4_2024-12-18 in 0.12 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-12-17' --> 'data\processed_data\GOOGL\4_2024-12-17.md'
Converted 'data\edgar_documents\GOOGL\4_2024-12-18' --> 'data\processed_data\GOOGL\4_2024-12-18.md'


2025-11-14 16:46:39,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,541 - INFO - Going to convert document batch...
2025-11-14 16:46:39,542 - INFO - Processing document 4_2024-12-27
2025-11-14 16:46:39,582 - INFO - Finished converting document 4_2024-12-27 in 0.11 sec.
2025-11-14 16:46:39,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,648 - INFO - Going to convert document batch...
2025-11-14 16:46:39,649 - INFO - Processing document 4_2025-01-02
2025-11-14 16:46:39,688 - INFO - Finished converting document 4_2025-01-02 in 0.08 sec.
2025-11-14 16:46:39,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,750 - INFO - Going to convert document batch...
2025-11-14 16:46:39,751 - INFO - Processing document 4_2025-01-03
2025-11-14 16:46:39,786 - INFO - Finished converting document 4_2025-01-03 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2024-12-27' --> 'data\processed_data\GOOGL\4_2024-12-27.md'
Converted 'data\edgar_documents\GOOGL\4_2025-01-02' --> 'data\processed_data\GOOGL\4_2025-01-02.md'
Converted 'data\edgar_documents\GOOGL\4_2025-01-03' --> 'data\processed_data\GOOGL\4_2025-01-03.md'


2025-11-14 16:46:39,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:39,856 - INFO - Going to convert document batch...
2025-11-14 16:46:39,857 - INFO - Processing document 4_2025-01-10
2025-11-14 16:46:39,890 - INFO - Finished converting document 4_2025-01-10 in 0.08 sec.
2025-11-14 16:46:39,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,005 - INFO - Going to convert document batch...
2025-11-14 16:46:40,007 - INFO - Processing document 4_2025-01-13
2025-11-14 16:46:40,042 - INFO - Finished converting document 4_2025-01-13 in 0.11 sec.
2025-11-14 16:46:40,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,097 - INFO - Going to convert document batch...
2025-11-14 16:46:40,098 - INFO - Processing document 4_2025-01-15
2025-11-14 16:46:40,126 - INFO - Finished converting document 4_2025-01-15 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-01-10' --> 'data\processed_data\GOOGL\4_2025-01-10.md'
Converted 'data\edgar_documents\GOOGL\4_2025-01-13' --> 'data\processed_data\GOOGL\4_2025-01-13.md'


2025-11-14 16:46:40,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,184 - INFO - Going to convert document batch...
2025-11-14 16:46:40,185 - INFO - Processing document 4_2025-01-24
2025-11-14 16:46:40,220 - INFO - Finished converting document 4_2025-01-24 in 0.06 sec.
2025-11-14 16:46:40,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,300 - INFO - Going to convert document batch...
2025-11-14 16:46:40,301 - INFO - Processing document 4_2025-01-28
2025-11-14 16:46:40,334 - INFO - Finished converting document 4_2025-01-28 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-01-15' --> 'data\processed_data\GOOGL\4_2025-01-15.md'
Converted 'data\edgar_documents\GOOGL\4_2025-01-24' --> 'data\processed_data\GOOGL\4_2025-01-24.md'


2025-11-14 16:46:40,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,397 - INFO - Going to convert document batch...
2025-11-14 16:46:40,399 - INFO - Processing document 4_2025-01-30
2025-11-14 16:46:40,435 - INFO - Finished converting document 4_2025-01-30 in 0.08 sec.
2025-11-14 16:46:40,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,519 - INFO - Going to convert document batch...
2025-11-14 16:46:40,519 - INFO - Processing document 4_2025-01-31


Converted 'data\edgar_documents\GOOGL\4_2025-01-28' --> 'data\processed_data\GOOGL\4_2025-01-28.md'
Converted 'data\edgar_documents\GOOGL\4_2025-01-30' --> 'data\processed_data\GOOGL\4_2025-01-30.md'


2025-11-14 16:46:40,561 - INFO - Finished converting document 4_2025-01-31 in 0.09 sec.
2025-11-14 16:46:40,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,659 - INFO - Going to convert document batch...
2025-11-14 16:46:40,660 - INFO - Processing document 4_2025-02-03
2025-11-14 16:46:40,690 - INFO - Finished converting document 4_2025-02-03 in 0.09 sec.
2025-11-14 16:46:40,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:40,743 - INFO - Going to convert document batch...
2025-11-14 16:46:40,744 - INFO - Processing document 4_2025-02-13
2025-11-14 16:46:40,791 - INFO - Finished converting document 4_2025-02-13 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-01-31' --> 'data\processed_data\GOOGL\4_2025-01-31.md'
Converted 'data\edgar_documents\GOOGL\4_2025-02-03' --> 'data\processed_data\GOOGL\4_2025-02-03.md'
Converted 'data\edgar_documents\GOOGL\4_2025-02-13' --> 'data\processed_data\GOOGL\4_2025-02-13.md'


2025-11-14 16:46:41,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:41,175 - INFO - Going to convert document batch...
2025-11-14 16:46:41,176 - INFO - Processing document 4_2025-02-19
2025-11-14 16:46:41,226 - INFO - Finished converting document 4_2025-02-19 in 0.39 sec.
2025-11-14 16:46:41,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:41,296 - INFO - Going to convert document batch...
2025-11-14 16:46:41,297 - INFO - Processing document 4_2025-02-20
2025-11-14 16:46:41,328 - INFO - Finished converting document 4_2025-02-20 in 0.06 sec.
2025-11-14 16:46:41,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:41,387 - INFO - Going to convert document batch...
2025-11-14 16:46:41,389 - INFO - Processing document 4_2025-02-21
2025-11-14 16:46:41,427 - INFO - Finished converting document 4_2025-02-21 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-02-19' --> 'data\processed_data\GOOGL\4_2025-02-19.md'
Converted 'data\edgar_documents\GOOGL\4_2025-02-20' --> 'data\processed_data\GOOGL\4_2025-02-20.md'
Converted 'data\edgar_documents\GOOGL\4_2025-02-21' --> 'data\processed_data\GOOGL\4_2025-02-21.md'


2025-11-14 16:46:41,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:41,492 - INFO - Going to convert document batch...
2025-11-14 16:46:41,493 - INFO - Processing document 4_2025-02-26
2025-11-14 16:46:41,823 - INFO - Finished converting document 4_2025-02-26 in 0.38 sec.
2025-11-14 16:46:41,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:41,915 - INFO - Going to convert document batch...
2025-11-14 16:46:41,916 - INFO - Processing document 4_2025-02-28
2025-11-14 16:46:41,953 - INFO - Finished converting document 4_2025-02-28 in 0.09 sec.
2025-11-14 16:46:41,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,007 - INFO - Going to convert document batch...
2025-11-14 16:46:42,008 - INFO - Processing document 4_2025-03-03
2025-11-14 16:46:42,034 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-02-26' --> 'data\processed_data\GOOGL\4_2025-02-26.md'
Converted 'data\edgar_documents\GOOGL\4_2025-02-28' --> 'data\processed_data\GOOGL\4_2025-02-28.md'
Converted 'data\edgar_documents\GOOGL\4_2025-03-03' --> 'data\processed_data\GOOGL\4_2025-03-03.md'


2025-11-14 16:46:42,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,094 - INFO - Going to convert document batch...
2025-11-14 16:46:42,095 - INFO - Processing document 4_2025-03-07
2025-11-14 16:46:42,124 - INFO - Finished converting document 4_2025-03-07 in 0.08 sec.
2025-11-14 16:46:42,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,180 - INFO - Going to convert document batch...
2025-11-14 16:46:42,180 - INFO - Processing document 4_2025-03-13
2025-11-14 16:46:42,208 - INFO - Finished converting document 4_2025-03-13 in 0.05 sec.
2025-11-14 16:46:42,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,257 - INFO - Going to convert document batch...
2025-11-14 16:46:42,258 - INFO - Processing document 4_2025-03-18
2025-11-14 16:46:42,290 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 16:46:42,329 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\4_2025-03-07' --> 'data\processed_data\GOOGL\4_2025-03-07.md'
Converted 'data\edgar_documents\GOOGL\4_2025-03-13' --> 'data\processed_data\GOOGL\4_2025-03-13.md'
Converted 'data\edgar_documents\GOOGL\4_2025-03-18' --> 'data\processed_data\GOOGL\4_2025-03-18.md'


2025-11-14 16:46:42,342 - INFO - Processing document 4_2025-03-19
2025-11-14 16:46:42,467 - INFO - Finished converting document 4_2025-03-19 in 0.16 sec.
2025-11-14 16:46:42,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,589 - INFO - Going to convert document batch...
2025-11-14 16:46:42,591 - INFO - Processing document 4_2025-03-26
2025-11-14 16:46:42,627 - INFO - Finished converting document 4_2025-03-26 in 0.11 sec.
2025-11-14 16:46:42,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,691 - INFO - Going to convert document batch...
2025-11-14 16:46:42,691 - INFO - Processing document 4_2025-03-27


Converted 'data\edgar_documents\GOOGL\4_2025-03-19' --> 'data\processed_data\GOOGL\4_2025-03-19.md'
Converted 'data\edgar_documents\GOOGL\4_2025-03-26' --> 'data\processed_data\GOOGL\4_2025-03-26.md'


2025-11-14 16:46:42,718 - INFO - Finished converting document 4_2025-03-27 in 0.06 sec.
2025-11-14 16:46:42,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,776 - INFO - Going to convert document batch...
2025-11-14 16:46:42,777 - INFO - Processing document 4_2025-03-31
2025-11-14 16:46:42,802 - INFO - Finished converting document 4_2025-03-31 in 0.05 sec.
2025-11-14 16:46:42,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,863 - INFO - Going to convert document batch...
2025-11-14 16:46:42,864 - INFO - Processing document 4_2025-04-01
2025-11-14 16:46:42,884 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 16:46:42,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:42,935 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2025-03-27' --> 'data\processed_data\GOOGL\4_2025-03-27.md'
Converted 'data\edgar_documents\GOOGL\4_2025-03-31' --> 'data\processed_data\GOOGL\4_2025-03-31.md'
Converted 'data\edgar_documents\GOOGL\4_2025-04-01' --> 'data\processed_data\GOOGL\4_2025-04-01.md'


2025-11-14 16:46:42,935 - INFO - Processing document 4_2025-04-04
2025-11-14 16:46:42,974 - INFO - Finished converting document 4_2025-04-04 in 0.06 sec.
2025-11-14 16:46:43,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,032 - INFO - Going to convert document batch...
2025-11-14 16:46:43,033 - INFO - Processing document 4_2025-04-14
2025-11-14 16:46:43,065 - INFO - Finished converting document 4_2025-04-14 in 0.06 sec.
2025-11-14 16:46:43,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,119 - INFO - Going to convert document batch...
2025-11-14 16:46:43,120 - INFO - Processing document 4_2025-04-18
2025-11-14 16:46:43,148 - INFO - Finished converting document 4_2025-04-18 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-04-04' --> 'data\processed_data\GOOGL\4_2025-04-04.md'
Converted 'data\edgar_documents\GOOGL\4_2025-04-14' --> 'data\processed_data\GOOGL\4_2025-04-14.md'
Converted 'data\edgar_documents\GOOGL\4_2025-04-18' --> 'data\processed_data\GOOGL\4_2025-04-18.md'


2025-11-14 16:46:43,219 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:46:43,220 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:46:43,221 - INFO - Going to convert document batch...
2025-11-14 16:46:43,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,266 - INFO - Going to convert document batch...
2025-11-14 16:46:43,268 - INFO - Processing document 4_2025-04-29
2025-11-14 16:46:43,314 - INFO - Fin

Error processing data\edgar_documents\GOOGL\4_2025-04-28: File format not allowed: data\edgar_documents\GOOGL\4_2025-04-28
Converted 'data\edgar_documents\GOOGL\4_2025-04-29' --> 'data\processed_data\GOOGL\4_2025-04-29.md'


2025-11-14 16:46:43,420 - ERROR - Input document 4_2025-04-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:46:43,422 - INFO - Going to convert document batch...
2025-11-14 16:46:43,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,445 - INFO - Going to convert document batch...
2025-11-14 16:46:43,446 - INFO - Processing document 4_2025-05-01
2025-11-14 16:46:43,476 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-11-14 16:46:43,516 - INFO - detec

Error processing data\edgar_documents\GOOGL\4_2025-04-30: File format not allowed: data\edgar_documents\GOOGL\4_2025-04-30
Converted 'data\edgar_documents\GOOGL\4_2025-05-01' --> 'data\processed_data\GOOGL\4_2025-05-01.md'


2025-11-14 16:46:43,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,634 - INFO - Going to convert document batch...
2025-11-14 16:46:43,635 - INFO - Processing document 4_2025-05-15
2025-11-14 16:46:43,671 - INFO - Finished converting document 4_2025-05-15 in 0.06 sec.
2025-11-14 16:46:43,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,728 - INFO - Going to convert document batch...
2025-11-14 16:46:43,729 - INFO - Processing document 4_2025-05-19
2025-11-14 16:46:43,772 - INFO - Finished converting document 4_2025-05-19 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-05-09' --> 'data\processed_data\GOOGL\4_2025-05-09.md'
Converted 'data\edgar_documents\GOOGL\4_2025-05-15' --> 'data\processed_data\GOOGL\4_2025-05-15.md'


2025-11-14 16:46:43,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:43,877 - INFO - Going to convert document batch...
2025-11-14 16:46:43,878 - INFO - Processing document 4_2025-05-21
2025-11-14 16:46:43,913 - INFO - Finished converting document 4_2025-05-21 in 0.09 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-05-19' --> 'data\processed_data\GOOGL\4_2025-05-19.md'


2025-11-14 16:46:44,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,092 - INFO - Going to convert document batch...
2025-11-14 16:46:44,093 - INFO - Processing document 4_2025-05-23
2025-11-14 16:46:44,128 - INFO - Finished converting document 4_2025-05-23 in 0.09 sec.
2025-11-14 16:46:44,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,188 - INFO - Going to convert document batch...
2025-11-14 16:46:44,189 - INFO - Processing document 4_2025-05-28
2025-11-14 16:46:44,215 - INFO - Finished converting document 4_2025-05-28 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-05-21' --> 'data\processed_data\GOOGL\4_2025-05-21.md'
Converted 'data\edgar_documents\GOOGL\4_2025-05-23' --> 'data\processed_data\GOOGL\4_2025-05-23.md'


2025-11-14 16:46:44,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,265 - INFO - Going to convert document batch...
2025-11-14 16:46:44,266 - INFO - Processing document 4_2025-06-02
2025-11-14 16:46:44,393 - INFO - Finished converting document 4_2025-06-02 in 0.16 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-05-28' --> 'data\processed_data\GOOGL\4_2025-05-28.md'


2025-11-14 16:46:44,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,486 - INFO - Going to convert document batch...
2025-11-14 16:46:44,487 - INFO - Processing document 4_2025-06-04
2025-11-14 16:46:44,515 - INFO - Finished converting document 4_2025-06-04 in 0.09 sec.
2025-11-14 16:46:44,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,571 - INFO - Going to convert document batch...
2025-11-14 16:46:44,572 - INFO - Processing document 4_2025-06-17
2025-11-14 16:46:44,602 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-06-02' --> 'data\processed_data\GOOGL\4_2025-06-02.md'
Converted 'data\edgar_documents\GOOGL\4_2025-06-04' --> 'data\processed_data\GOOGL\4_2025-06-04.md'


2025-11-14 16:46:44,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,658 - INFO - Going to convert document batch...
2025-11-14 16:46:44,659 - INFO - Processing document 4_2025-06-18
2025-11-14 16:46:44,776 - INFO - Finished converting document 4_2025-06-18 in 0.16 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-06-17' --> 'data\processed_data\GOOGL\4_2025-06-17.md'
Converted 'data\edgar_documents\GOOGL\4_2025-06-18' --> 'data\processed_data\GOOGL\4_2025-06-18.md'


2025-11-14 16:46:44,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,849 - INFO - Going to convert document batch...
2025-11-14 16:46:44,850 - INFO - Processing document 4_2025-06-20
2025-11-14 16:46:44,887 - INFO - Finished converting document 4_2025-06-20 in 0.06 sec.
2025-11-14 16:46:44,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:44,954 - INFO - Going to convert document batch...
2025-11-14 16:46:44,955 - INFO - Processing document 4_2025-06-27
2025-11-14 16:46:44,985 - INFO - Finished converting document 4_2025-06-27 in 0.06 sec.
2025-11-14 16:46:45,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,059 - INFO - Going to convert document batch...
2025-11-14 16:46:45,059 - INFO - Processing document 4_2025-06-30
2025-11-14 16:46:45,084 - INFO - Finished converting document 4_2025-06-30 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-06-20' --> 'data\processed_data\GOOGL\4_2025-06-20.md'
Converted 'data\edgar_documents\GOOGL\4_2025-06-27' --> 'data\processed_data\GOOGL\4_2025-06-27.md'
Converted 'data\edgar_documents\GOOGL\4_2025-06-30' --> 'data\processed_data\GOOGL\4_2025-06-30.md'


2025-11-14 16:46:45,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,139 - INFO - Going to convert document batch...
2025-11-14 16:46:45,141 - INFO - Processing document 4_2025-07-03
2025-11-14 16:46:45,171 - INFO - Finished converting document 4_2025-07-03 in 0.06 sec.
2025-11-14 16:46:45,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,223 - INFO - Going to convert document batch...
2025-11-14 16:46:45,224 - INFO - Processing document 4_2025-07-11
2025-11-14 16:46:45,247 - INFO - Finished converting document 4_2025-07-11 in 0.05 sec.
2025-11-14 16:46:45,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,297 - INFO - Going to convert document batch...
2025-11-14 16:46:45,298 - INFO - Processing document 4_2025-07-16
2025-11-14 16:46:45,330 - INFO - Finished converting document 4_2025-07-16 in 0.06 sec.
2025-11-14 16:46:45,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\4_2025-07-03' --> 'data\processed_data\GOOGL\4_2025-07-03.md'
Converted 'data\edgar_documents\GOOGL\4_2025-07-11' --> 'data\processed_data\GOOGL\4_2025-07-11.md'
Converted 'data\edgar_documents\GOOGL\4_2025-07-16' --> 'data\processed_data\GOOGL\4_2025-07-16.md'


2025-11-14 16:46:45,389 - INFO - Processing document 4_2025-07-17
2025-11-14 16:46:45,428 - INFO - Finished converting document 4_2025-07-17 in 0.06 sec.
2025-11-14 16:46:45,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,515 - INFO - Going to convert document batch...
2025-11-14 16:46:45,516 - INFO - Processing document 4_2025-07-21
2025-11-14 16:46:45,559 - INFO - Finished converting document 4_2025-07-21 in 0.09 sec.
2025-11-14 16:46:45,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,617 - INFO - Going to convert document batch...
2025-11-14 16:46:45,618 - INFO - Processing document 4_2025-07-28
2025-11-14 16:46:45,649 - INFO - Finished converting document 4_2025-07-28 in 0.05 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-07-17' --> 'data\processed_data\GOOGL\4_2025-07-17.md'
Converted 'data\edgar_documents\GOOGL\4_2025-07-21' --> 'data\processed_data\GOOGL\4_2025-07-21.md'
Converted 'data\edgar_documents\GOOGL\4_2025-07-28' --> 'data\processed_data\GOOGL\4_2025-07-28.md'


2025-11-14 16:46:45,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,715 - INFO - Going to convert document batch...
2025-11-14 16:46:45,715 - INFO - Processing document 4_2025-07-31
2025-11-14 16:46:45,745 - INFO - Finished converting document 4_2025-07-31 in 0.08 sec.
2025-11-14 16:46:45,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,808 - INFO - Going to convert document batch...
2025-11-14 16:46:45,809 - INFO - Processing document 4_2025-08-05
2025-11-14 16:46:45,848 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 16:46:45,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:45,912 - INFO - Going to convert document batch...
2025-11-14 16:46:45,913 - INFO - Processing document 4_2025-08-06
2025-11-14 16:46:45,941 - INFO - Finished converting document 4_2025-08-06 in 0.05 sec.
2025-11-14 16:46:45,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2025-07-31' --> 'data\processed_data\GOOGL\4_2025-07-31.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-05' --> 'data\processed_data\GOOGL\4_2025-08-05.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-06' --> 'data\processed_data\GOOGL\4_2025-08-06.md'


2025-11-14 16:46:45,992 - INFO - Going to convert document batch...
2025-11-14 16:46:45,993 - INFO - Processing document 4_2025-08-07
2025-11-14 16:46:46,026 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.
2025-11-14 16:46:46,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,079 - INFO - Going to convert document batch...
2025-11-14 16:46:46,079 - INFO - Processing document 4_2025-08-11
2025-11-14 16:46:46,106 - INFO - Finished converting document 4_2025-08-11 in 0.05 sec.
2025-11-14 16:46:46,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,161 - INFO - Going to convert document batch...
2025-11-14 16:46:46,163 - INFO - Processing document 4_2025-08-14
2025-11-14 16:46:46,200 - INFO - Finished converting document 4_2025-08-14 in 0.08 sec.
2025-11-14 16:46:46,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2025-08-07' --> 'data\processed_data\GOOGL\4_2025-08-07.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-11' --> 'data\processed_data\GOOGL\4_2025-08-11.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-14' --> 'data\processed_data\GOOGL\4_2025-08-14.md'


2025-11-14 16:46:46,561 - INFO - Going to convert document batch...
2025-11-14 16:46:46,561 - INFO - Processing document 4_2025-08-18
2025-11-14 16:46:46,711 - INFO - Finished converting document 4_2025-08-18 in 0.47 sec.
2025-11-14 16:46:46,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,767 - INFO - Going to convert document batch...
2025-11-14 16:46:46,768 - INFO - Processing document 4_2025-08-21
2025-11-14 16:46:46,788 - INFO - Finished converting document 4_2025-08-21 in 0.03 sec.
2025-11-14 16:46:46,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,835 - INFO - Going to convert document batch...
2025-11-14 16:46:46,836 - INFO - Processing document 4_2025-08-26
2025-11-14 16:46:46,861 - INFO - Finished converting document 4_2025-08-26 in 0.05 sec.
2025-11-14 16:46:46,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,908 - INFO - Going to convert document batch...
2025-11-14 16:46:46,909 - 

Converted 'data\edgar_documents\GOOGL\4_2025-08-18' --> 'data\processed_data\GOOGL\4_2025-08-18.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-21' --> 'data\processed_data\GOOGL\4_2025-08-21.md'
Converted 'data\edgar_documents\GOOGL\4_2025-08-26' --> 'data\processed_data\GOOGL\4_2025-08-26.md'


2025-11-14 16:46:46,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:46,991 - INFO - Going to convert document batch...
2025-11-14 16:46:46,992 - INFO - Processing document 4_2025-09-05
2025-11-14 16:46:47,026 - INFO - Finished converting document 4_2025-09-05 in 0.08 sec.
2025-11-14 16:46:47,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,084 - INFO - Going to convert document batch...
2025-11-14 16:46:47,085 - INFO - Processing document 4_2025-09-16
2025-11-14 16:46:47,108 - INFO - Finished converting document 4_2025-09-16 in 0.05 sec.
2025-11-14 16:46:47,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\4_2025-08-29' --> 'data\processed_data\GOOGL\4_2025-08-29.md'
Converted 'data\edgar_documents\GOOGL\4_2025-09-05' --> 'data\processed_data\GOOGL\4_2025-09-05.md'
Converted 'data\edgar_documents\GOOGL\4_2025-09-16' --> 'data\processed_data\GOOGL\4_2025-09-16.md'


2025-11-14 16:46:47,180 - INFO - Going to convert document batch...
2025-11-14 16:46:47,182 - INFO - Processing document 4_2025-09-17
2025-11-14 16:46:47,224 - INFO - Finished converting document 4_2025-09-17 in 0.09 sec.
2025-11-14 16:46:47,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,385 - INFO - Going to convert document batch...
2025-11-14 16:46:47,385 - INFO - Processing document 4_2025-09-29
2025-11-14 16:46:47,420 - INFO - Finished converting document 4_2025-09-29 in 0.09 sec.
2025-11-14 16:46:47,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,482 - INFO - Going to convert document batch...
2025-11-14 16:46:47,484 - INFO - Processing document 4_2025-09-30
2025-11-14 16:46:47,511 - INFO - Finished converting document 4_2025-09-30 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-09-17' --> 'data\processed_data\GOOGL\4_2025-09-17.md'
Converted 'data\edgar_documents\GOOGL\4_2025-09-29' --> 'data\processed_data\GOOGL\4_2025-09-29.md'


2025-11-14 16:46:47,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,578 - INFO - Going to convert document batch...
2025-11-14 16:46:47,580 - INFO - Processing document 4_2025-10-01
2025-11-14 16:46:47,626 - INFO - Finished converting document 4_2025-10-01 in 0.08 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-09-30' --> 'data\processed_data\GOOGL\4_2025-09-30.md'
Converted 'data\edgar_documents\GOOGL\4_2025-10-01' --> 'data\processed_data\GOOGL\4_2025-10-01.md'


2025-11-14 16:46:47,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,772 - INFO - Going to convert document batch...
2025-11-14 16:46:47,773 - INFO - Processing document 4_2025-10-02
2025-11-14 16:46:47,811 - INFO - Finished converting document 4_2025-10-02 in 0.16 sec.
2025-11-14 16:46:47,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:47,911 - INFO - Going to convert document batch...
2025-11-14 16:46:47,911 - INFO - Processing document 4_2025-10-15
2025-11-14 16:46:47,944 - INFO - Finished converting document 4_2025-10-15 in 0.09 sec.
2025-11-14 16:46:47,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,000 - INFO - Going to convert document batch...
2025-11-14 16:46:48,001 - INFO - Processing document 4_2025-10-17
2025-11-14 16:46:48,040 - INFO - Finished converting document 4_2025-10-17 in 0.06 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-10-02' --> 'data\processed_data\GOOGL\4_2025-10-02.md'
Converted 'data\edgar_documents\GOOGL\4_2025-10-15' --> 'data\processed_data\GOOGL\4_2025-10-15.md'


2025-11-14 16:46:48,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,103 - INFO - Going to convert document batch...
2025-11-14 16:46:48,104 - INFO - Processing document 4_2025-10-29
2025-11-14 16:46:48,136 - INFO - Finished converting document 4_2025-10-29 in 0.08 sec.
2025-11-14 16:46:48,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,254 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\4_2025-10-17' --> 'data\processed_data\GOOGL\4_2025-10-17.md'
Converted 'data\edgar_documents\GOOGL\4_2025-10-29' --> 'data\processed_data\GOOGL\4_2025-10-29.md'


2025-11-14 16:46:48,255 - INFO - Processing document 4_2025-11-03
2025-11-14 16:46:48,295 - INFO - Finished converting document 4_2025-11-03 in 0.12 sec.
2025-11-14 16:46:48,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,465 - INFO - Going to convert document batch...
2025-11-14 16:46:48,466 - INFO - Processing document 4_2025-11-04
2025-11-14 16:46:48,492 - INFO - Finished converting document 4_2025-11-04 in 0.16 sec.


Converted 'data\edgar_documents\GOOGL\4_2025-11-03' --> 'data\processed_data\GOOGL\4_2025-11-03.md'


2025-11-14 16:46:48,552 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:46:48,552 - ERROR - Input document 4_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:46:48,554 - INFO - Going to convert document batch...
2025-11-14 16:46:48,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,583 - INFO - Going to convert document batch...
2025-11-14 16:46:48,584 - INFO - Processing document 4_2025-11-07
2025-11-14 16:46:48,621 - INFO - Fin

Converted 'data\edgar_documents\GOOGL\4_2025-11-04' --> 'data\processed_data\GOOGL\4_2025-11-04.md'
Error processing data\edgar_documents\GOOGL\4_2025-11-05: File format not allowed: data\edgar_documents\GOOGL\4_2025-11-05
Converted 'data\edgar_documents\GOOGL\4_2025-11-07' --> 'data\processed_data\GOOGL\4_2025-11-07.md'


2025-11-14 16:46:48,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,743 - INFO - Going to convert document batch...
2025-11-14 16:46:48,744 - INFO - Processing document 8-K_2023-01-25
2025-11-14 16:46:48,760 - INFO - Finished converting document 8-K_2023-01-25 in 0.03 sec.
2025-11-14 16:46:48,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,800 - INFO - Going to convert document batch...
2025-11-14 16:46:48,801 - INFO - Processing document 8-K_2023-02-02
2025-11-14 16:46:48,820 - INFO - Finished converting document 8-K_2023-02-02 in 0.05 sec.
2025-11-14 16:46:48,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,855 - INFO - Going to convert document batch...
2025-11-14 16:46:48,856 - INFO - Processing document 8-K_2023-04-20
2025-11-14 16:46:48,870 - INFO - Finished converting document 8-K_2023-04-20 in 0.05 sec.
2025-11-14 16:46:48,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\GOOGL\8-K_2023-01-20' --> 'data\processed_data\GOOGL\8-K_2023-01-20.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-01-25' --> 'data\processed_data\GOOGL\8-K_2023-01-25.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-02-02' --> 'data\processed_data\GOOGL\8-K_2023-02-02.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-04-20' --> 'data\processed_data\GOOGL\8-K_2023-04-20.md'


2025-11-14 16:46:48,907 - INFO - Processing document 8-K_2023-04-21
2025-11-14 16:46:48,929 - INFO - Finished converting document 8-K_2023-04-21 in 0.05 sec.
2025-11-14 16:46:48,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:48,977 - INFO - Going to convert document batch...
2025-11-14 16:46:48,978 - INFO - Processing document 8-K_2023-04-25
2025-11-14 16:46:48,996 - INFO - Finished converting document 8-K_2023-04-25 in 0.06 sec.
2025-11-14 16:46:49,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,064 - INFO - Going to convert document batch...
2025-11-14 16:46:49,065 - INFO - Processing document 8-K_2023-06-08


Converted 'data\edgar_documents\GOOGL\8-K_2023-04-21' --> 'data\processed_data\GOOGL\8-K_2023-04-21.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-04-25' --> 'data\processed_data\GOOGL\8-K_2023-04-25.md'


2025-11-14 16:46:49,132 - INFO - Finished converting document 8-K_2023-06-08 in 0.12 sec.
2025-11-14 16:46:49,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,225 - INFO - Going to convert document batch...
2025-11-14 16:46:49,226 - INFO - Processing document 8-K_2023-07-25
2025-11-14 16:46:49,245 - INFO - Finished converting document 8-K_2023-07-25 in 0.09 sec.
2025-11-14 16:46:49,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,279 - INFO - Going to convert document batch...
2025-11-14 16:46:49,280 - INFO - Processing document 8-K_2023-10-24
2025-11-14 16:46:49,297 - INFO - Finished converting document 8-K_2023-10-24 in 0.05 sec.
2025-11-14 16:46:49,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,329 - INFO - Going to convert document batch...
2025-11-14 16:46:49,330 - INFO - Processing document 8-K_2024-01-30


Converted 'data\edgar_documents\GOOGL\8-K_2023-06-08' --> 'data\processed_data\GOOGL\8-K_2023-06-08.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-07-25' --> 'data\processed_data\GOOGL\8-K_2023-07-25.md'
Converted 'data\edgar_documents\GOOGL\8-K_2023-10-24' --> 'data\processed_data\GOOGL\8-K_2023-10-24.md'


2025-11-14 16:46:49,346 - INFO - Finished converting document 8-K_2024-01-30 in 0.03 sec.
2025-11-14 16:46:49,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,386 - INFO - Going to convert document batch...
2025-11-14 16:46:49,388 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:46:49,408 - INFO - Finished converting document 8-K_2024-02-08 in 0.05 sec.
2025-11-14 16:46:49,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,443 - INFO - Going to convert document batch...
2025-11-14 16:46:49,444 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:46:49,463 - INFO - Finished converting document 8-K_2024-04-25 in 0.06 sec.
2025-11-14 16:46:49,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,496 - INFO - Going to convert document batch...
2025-11-14 16:46:49,496 - INFO - Processing document 8-K_2024-06-05
2025-11-14 16:46:49,517 - INFO - Finished converting document 8-K_2024-06-05 in 0.

Converted 'data\edgar_documents\GOOGL\8-K_2024-01-30' --> 'data\processed_data\GOOGL\8-K_2024-01-30.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-02-08' --> 'data\processed_data\GOOGL\8-K_2024-02-08.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-04-25' --> 'data\processed_data\GOOGL\8-K_2024-04-25.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-06-05' --> 'data\processed_data\GOOGL\8-K_2024-06-05.md'


2025-11-14 16:46:49,561 - INFO - Going to convert document batch...
2025-11-14 16:46:49,562 - INFO - Processing document 8-K_2024-06-07
2025-11-14 16:46:49,600 - INFO - Finished converting document 8-K_2024-06-07 in 0.06 sec.
2025-11-14 16:46:49,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,665 - INFO - Going to convert document batch...
2025-11-14 16:46:49,665 - INFO - Processing document 8-K_2024-06-13
2025-11-14 16:46:49,824 - INFO - Finished converting document 8-K_2024-06-13 in 0.22 sec.


Converted 'data\edgar_documents\GOOGL\8-K_2024-06-07' --> 'data\processed_data\GOOGL\8-K_2024-06-07.md'


2025-11-14 16:46:49,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,903 - INFO - Going to convert document batch...
2025-11-14 16:46:49,904 - INFO - Processing document 8-K_2024-06-26
2025-11-14 16:46:49,935 - INFO - Finished converting document 8-K_2024-06-26 in 0.09 sec.
2025-11-14 16:46:49,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:49,978 - INFO - Going to convert document batch...
2025-11-14 16:46:49,978 - INFO - Processing document 8-K_2024-07-23
2025-11-14 16:46:49,999 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 16:46:50,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,031 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\GOOGL\8-K_2024-06-13' --> 'data\processed_data\GOOGL\8-K_2024-06-13.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-06-26' --> 'data\processed_data\GOOGL\8-K_2024-06-26.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-07-23' --> 'data\processed_data\GOOGL\8-K_2024-07-23.md'


2025-11-14 16:46:50,031 - INFO - Processing document 8-K_2024-08-06
2025-11-14 16:46:50,046 - INFO - Finished converting document 8-K_2024-08-06 in 0.03 sec.
2025-11-14 16:46:50,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,176 - INFO - Going to convert document batch...
2025-11-14 16:46:50,180 - INFO - Processing document 8-K_2024-09-24
2025-11-14 16:46:50,200 - INFO - Finished converting document 8-K_2024-09-24 in 0.14 sec.
2025-11-14 16:46:50,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\8-K_2024-08-06' --> 'data\processed_data\GOOGL\8-K_2024-08-06.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-09-24' --> 'data\processed_data\GOOGL\8-K_2024-09-24.md'


2025-11-14 16:46:50,283 - INFO - Going to convert document batch...
2025-11-14 16:46:50,285 - INFO - Processing document 8-K_2024-10-17
2025-11-14 16:46:50,306 - INFO - Finished converting document 8-K_2024-10-17 in 0.09 sec.
2025-11-14 16:46:50,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,343 - INFO - Going to convert document batch...
2025-11-14 16:46:50,344 - INFO - Processing document 8-K_2024-10-29
2025-11-14 16:46:50,360 - INFO - Finished converting document 8-K_2024-10-29 in 0.05 sec.
2025-11-14 16:46:50,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,394 - INFO - Going to convert document batch...
2025-11-14 16:46:50,395 - INFO - Processing document 8-K_2025-02-04
2025-11-14 16:46:50,410 - INFO - Finished converting document 8-K_2025-02-04 in 0.03 sec.
2025-11-14 16:46:50,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,440 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\8-K_2024-10-17' --> 'data\processed_data\GOOGL\8-K_2024-10-17.md'
Converted 'data\edgar_documents\GOOGL\8-K_2024-10-29' --> 'data\processed_data\GOOGL\8-K_2024-10-29.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-02-04' --> 'data\processed_data\GOOGL\8-K_2025-02-04.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-03-18' --> 'data\processed_data\GOOGL\8-K_2025-03-18.md'


2025-11-14 16:46:50,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,544 - INFO - Going to convert document batch...
2025-11-14 16:46:50,545 - INFO - Processing document 8-K_2025-04-24
2025-11-14 16:46:50,563 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 16:46:50,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,639 - INFO - Going to convert document batch...
2025-11-14 16:46:50,654 - INFO - Processing document 8-K_2025-05-01


Converted 'data\edgar_documents\GOOGL\8-K_2025-04-18' --> 'data\processed_data\GOOGL\8-K_2025-04-18.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-04-24' --> 'data\processed_data\GOOGL\8-K_2025-04-24.md'


2025-11-14 16:46:50,715 - INFO - Finished converting document 8-K_2025-05-01 in 0.14 sec.
2025-11-14 16:46:50,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,763 - INFO - Going to convert document batch...
2025-11-14 16:46:50,764 - INFO - Processing document 8-K_2025-05-06
2025-11-14 16:46:50,790 - INFO - Finished converting document 8-K_2025-05-06 in 0.05 sec.
2025-11-14 16:46:50,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:50,890 - INFO - Going to convert document batch...
2025-11-14 16:46:50,892 - INFO - Processing document 8-K_2025-06-12


Converted 'data\edgar_documents\GOOGL\8-K_2025-05-01' --> 'data\processed_data\GOOGL\8-K_2025-05-01.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-05-06' --> 'data\processed_data\GOOGL\8-K_2025-05-06.md'


2025-11-14 16:46:50,951 - INFO - Finished converting document 8-K_2025-06-12 in 0.14 sec.
2025-11-14 16:46:51,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:51,046 - INFO - Going to convert document batch...
2025-11-14 16:46:51,047 - INFO - Processing document 8-K_2025-07-18
2025-11-14 16:46:51,072 - INFO - Finished converting document 8-K_2025-07-18 in 0.09 sec.
2025-11-14 16:46:51,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:51,108 - INFO - Going to convert document batch...
2025-11-14 16:46:51,108 - INFO - Processing document 8-K_2025-07-23
2025-11-14 16:46:51,129 - INFO - Finished converting document 8-K_2025-07-23 in 0.05 sec.
2025-11-14 16:46:51,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\8-K_2025-06-12' --> 'data\processed_data\GOOGL\8-K_2025-06-12.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-07-18' --> 'data\processed_data\GOOGL\8-K_2025-07-18.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-07-23' --> 'data\processed_data\GOOGL\8-K_2025-07-23.md'


2025-11-14 16:46:51,173 - INFO - Going to convert document batch...
2025-11-14 16:46:51,174 - INFO - Processing document 8-K_2025-09-03
2025-11-14 16:46:51,198 - INFO - Finished converting document 8-K_2025-09-03 in 0.06 sec.
2025-11-14 16:46:51,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:51,245 - INFO - Going to convert document batch...
2025-11-14 16:46:51,246 - INFO - Processing document 8-K_2025-09-05
2025-11-14 16:46:51,270 - INFO - Finished converting document 8-K_2025-09-05 in 0.06 sec.
2025-11-14 16:46:51,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:51,304 - INFO - Going to convert document batch...
2025-11-14 16:46:51,305 - INFO - Processing document 8-K_2025-10-29
2025-11-14 16:46:51,323 - INFO - Finished converting document 8-K_2025-10-29 in 0.05 sec.
2025-11-14 16:46:51,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:46:51,369 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\GOOGL\8-K_2025-09-03' --> 'data\processed_data\GOOGL\8-K_2025-09-03.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-09-05' --> 'data\processed_data\GOOGL\8-K_2025-09-05.md'
Converted 'data\edgar_documents\GOOGL\8-K_2025-10-29' --> 'data\processed_data\GOOGL\8-K_2025-10-29.md'


2025-11-14 16:46:51,463 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:46:51,466 - ERROR - Input document DEF-14A_2023-04-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:46:51,469 - INFO - Going to convert document batch...
2025-11-14 16:46:51,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\8-K_2025-11-06' --> 'data\processed_data\GOOGL\8-K_2025-11-06.md'
Error processing data\edgar_documents\GOOGL\DEF-14A_2023-04-21: File format not allowed: data\edgar_documents\GOOGL\DEF-14A_2023-04-21


2025-11-14 16:46:52,370 - INFO - Going to convert document batch...
2025-11-14 16:46:52,371 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 16:46:54,685 - INFO - Finished converting document DEF-14A_2024-04-26 in 3.22 sec.
2025-11-14 16:46:56,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\DEF-14A_2024-04-26' --> 'data\processed_data\GOOGL\DEF-14A_2024-04-26.md'


2025-11-14 16:46:56,741 - INFO - Going to convert document batch...
2025-11-14 16:46:56,742 - INFO - Processing document DEF-14A_2025-04-25
2025-11-14 16:46:58,867 - INFO - Finished converting document DEF-14A_2025-04-25 in 2.70 sec.
2025-11-14 16:47:00,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\GOOGL\DEF-14A_2025-04-25' --> 'data\processed_data\GOOGL\DEF-14A_2025-04-25.md'
Processed 283 new files. Errors: 4
Found 104 files to process in data\edgar_documents\HD


2025-11-14 16:47:00,858 - INFO - Going to convert document batch...
2025-11-14 16:47:00,859 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:47:00,861 - INFO - Processing document 10-K_2023-03-15
2025-11-14 16:47:02,684 - INFO - Finished converting document 10-K_2023-03-15 in 2.47 sec.
2025-11-14 16:47:03,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-K_2023-03-15' --> 'data\processed_data\HD\10-K_2023-03-15.md'


2025-11-14 16:47:04,290 - INFO - Going to convert document batch...
2025-11-14 16:47:04,291 - INFO - Processing document 10-K_2024-03-13
2025-11-14 16:47:05,955 - INFO - Finished converting document 10-K_2024-03-13 in 2.70 sec.
2025-11-14 16:47:06,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-K_2024-03-13' --> 'data\processed_data\HD\10-K_2024-03-13.md'


2025-11-14 16:47:07,593 - INFO - Going to convert document batch...
2025-11-14 16:47:07,593 - INFO - Processing document 10-K_2025-03-21
2025-11-14 16:47:09,435 - INFO - Finished converting document 10-K_2025-03-21 in 2.97 sec.
2025-11-14 16:47:10,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-K_2025-03-21' --> 'data\processed_data\HD\10-K_2025-03-21.md'


2025-11-14 16:47:10,272 - INFO - Going to convert document batch...
2025-11-14 16:47:10,273 - INFO - Processing document 10-Q_2023-05-23
2025-11-14 16:47:10,701 - INFO - Finished converting document 10-Q_2023-05-23 in 0.67 sec.
2025-11-14 16:47:11,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2023-05-23' --> 'data\processed_data\HD\10-Q_2023-05-23.md'


2025-11-14 16:47:11,273 - INFO - Going to convert document batch...
2025-11-14 16:47:11,274 - INFO - Processing document 10-Q_2023-08-22
2025-11-14 16:47:11,755 - INFO - Finished converting document 10-Q_2023-08-22 in 0.77 sec.
2025-11-14 16:47:12,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2023-08-22' --> 'data\processed_data\HD\10-Q_2023-08-22.md'


2025-11-14 16:47:12,695 - INFO - Going to convert document batch...
2025-11-14 16:47:12,695 - INFO - Processing document 10-Q_2023-11-21
2025-11-14 16:47:13,311 - INFO - Finished converting document 10-Q_2023-11-21 in 1.31 sec.
2025-11-14 16:47:13,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2023-11-21' --> 'data\processed_data\HD\10-Q_2023-11-21.md'


2025-11-14 16:47:13,999 - INFO - Going to convert document batch...
2025-11-14 16:47:14,000 - INFO - Processing document 10-Q_2024-05-21
2025-11-14 16:47:14,402 - INFO - Finished converting document 10-Q_2024-05-21 in 0.72 sec.
2025-11-14 16:47:14,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2024-05-21' --> 'data\processed_data\HD\10-Q_2024-05-21.md'


2025-11-14 16:47:14,955 - INFO - Going to convert document batch...
2025-11-14 16:47:14,957 - INFO - Processing document 10-Q_2024-08-20
2025-11-14 16:47:15,660 - INFO - Finished converting document 10-Q_2024-08-20 in 1.05 sec.
2025-11-14 16:47:15,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2024-08-20' --> 'data\processed_data\HD\10-Q_2024-08-20.md'


2025-11-14 16:47:16,580 - INFO - Going to convert document batch...
2025-11-14 16:47:16,581 - INFO - Processing document 10-Q_2024-11-19
2025-11-14 16:47:17,172 - INFO - Finished converting document 10-Q_2024-11-19 in 1.22 sec.
2025-11-14 16:47:17,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2024-11-19' --> 'data\processed_data\HD\10-Q_2024-11-19.md'


2025-11-14 16:47:17,693 - INFO - Going to convert document batch...
2025-11-14 16:47:17,693 - INFO - Processing document 10-Q_2025-05-28
2025-11-14 16:47:18,152 - INFO - Finished converting document 10-Q_2025-05-28 in 0.72 sec.
2025-11-14 16:47:18,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\10-Q_2025-05-28' --> 'data\processed_data\HD\10-Q_2025-05-28.md'


2025-11-14 16:47:18,766 - INFO - Going to convert document batch...
2025-11-14 16:47:18,767 - INFO - Processing document 10-Q_2025-08-26
2025-11-14 16:47:19,786 - INFO - Finished converting document 10-Q_2025-08-26 in 1.39 sec.
2025-11-14 16:47:20,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,295 - INFO - Going to convert document batch...
2025-11-14 16:47:20,296 - INFO - Processing document 4_2023-02-02
2025-11-14 16:47:20,317 - INFO - Finished converting document 4_2023-02-02 in 0.05 sec.
2025-11-14 16:47:20,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,367 - INFO - Going to convert document batch...
2025-11-14 16:47:20,368 - INFO - Processing document 4_2023-02-24
2025-11-14 16:47:20,389 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 16:47:20,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,433 - INFO - Going to convert document batch...
2025-11-14 16:47:20,

Converted 'data\edgar_documents\HD\10-Q_2025-08-26' --> 'data\processed_data\HD\10-Q_2025-08-26.md'
Converted 'data\edgar_documents\HD\4_2023-02-02' --> 'data\processed_data\HD\4_2023-02-02.md'
Converted 'data\edgar_documents\HD\4_2023-02-24' --> 'data\processed_data\HD\4_2023-02-24.md'


2025-11-14 16:47:20,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,508 - INFO - Going to convert document batch...
2025-11-14 16:47:20,509 - INFO - Processing document 4_2023-03-15
2025-11-14 16:47:20,536 - INFO - Finished converting document 4_2023-03-15 in 0.05 sec.
2025-11-14 16:47:20,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,598 - INFO - Going to convert document batch...
2025-11-14 16:47:20,599 - INFO - Processing document 4_2023-03-23
2025-11-14 16:47:20,622 - INFO - Finished converting document 4_2023-03-23 in 0.06 sec.
2025-11-14 16:47:20,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,678 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2023-03-01' --> 'data\processed_data\HD\4_2023-03-01.md'
Converted 'data\edgar_documents\HD\4_2023-03-15' --> 'data\processed_data\HD\4_2023-03-15.md'
Converted 'data\edgar_documents\HD\4_2023-03-23' --> 'data\processed_data\HD\4_2023-03-23.md'


2025-11-14 16:47:20,679 - INFO - Processing document 4_2023-05-19
2025-11-14 16:47:20,717 - INFO - Finished converting document 4_2023-05-19 in 0.06 sec.
2025-11-14 16:47:20,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:20,935 - INFO - Going to convert document batch...
2025-11-14 16:47:20,936 - INFO - Processing document 4_2023-05-22
2025-11-14 16:47:20,971 - INFO - Finished converting document 4_2023-05-22 in 0.11 sec.
2025-11-14 16:47:21,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\4_2023-05-19' --> 'data\processed_data\HD\4_2023-05-19.md'
Converted 'data\edgar_documents\HD\4_2023-05-22' --> 'data\processed_data\HD\4_2023-05-22.md'


2025-11-14 16:47:21,075 - INFO - Going to convert document batch...
2025-11-14 16:47:21,076 - INFO - Processing document 4_2023-05-23
2025-11-14 16:47:21,116 - INFO - Finished converting document 4_2023-05-23 in 0.11 sec.
2025-11-14 16:47:21,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,235 - INFO - Going to convert document batch...
2025-11-14 16:47:21,237 - INFO - Processing document 4_2023-08-22
2025-11-14 16:47:21,266 - INFO - Finished converting document 4_2023-08-22 in 0.09 sec.
2025-11-14 16:47:21,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,341 - INFO - Going to convert document batch...
2025-11-14 16:47:21,344 - INFO - Processing document 4_2023-08-24
2025-11-14 16:47:21,376 - INFO - Finished converting document 4_2023-08-24 in 0.08 sec.


Converted 'data\edgar_documents\HD\4_2023-05-23' --> 'data\processed_data\HD\4_2023-05-23.md'
Converted 'data\edgar_documents\HD\4_2023-08-22' --> 'data\processed_data\HD\4_2023-08-22.md'


2025-11-14 16:47:21,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,418 - INFO - Going to convert document batch...
2025-11-14 16:47:21,420 - INFO - Processing document 4_2023-08-25
2025-11-14 16:47:21,449 - INFO - Finished converting document 4_2023-08-25 in 0.06 sec.
2025-11-14 16:47:21,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,500 - INFO - Going to convert document batch...
2025-11-14 16:47:21,501 - INFO - Processing document 4_2023-09-06
2025-11-14 16:47:21,523 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 16:47:21,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,569 - INFO - Going to convert document batch...
2025-11-14 16:47:21,570 - INFO - Processing document 4_2023-09-26


Converted 'data\edgar_documents\HD\4_2023-08-24' --> 'data\processed_data\HD\4_2023-08-24.md'
Converted 'data\edgar_documents\HD\4_2023-08-25' --> 'data\processed_data\HD\4_2023-08-25.md'
Converted 'data\edgar_documents\HD\4_2023-09-06' --> 'data\processed_data\HD\4_2023-09-06.md'


2025-11-14 16:47:21,589 - INFO - Finished converting document 4_2023-09-26 in 0.05 sec.
2025-11-14 16:47:21,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,641 - INFO - Going to convert document batch...
2025-11-14 16:47:21,643 - INFO - Processing document 4_2023-11-17
2025-11-14 16:47:21,670 - INFO - Finished converting document 4_2023-11-17 in 0.06 sec.
2025-11-14 16:47:21,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:21,715 - INFO - Going to convert document batch...
2025-11-14 16:47:21,716 - INFO - Processing document 4_2023-11-21
2025-11-14 16:47:21,747 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 16:47:21,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\4_2023-09-26' --> 'data\processed_data\HD\4_2023-09-26.md'
Converted 'data\edgar_documents\HD\4_2023-11-17' --> 'data\processed_data\HD\4_2023-11-17.md'
Converted 'data\edgar_documents\HD\4_2023-11-21' --> 'data\processed_data\HD\4_2023-11-21.md'


2025-11-14 16:47:21,801 - INFO - Going to convert document batch...
2025-11-14 16:47:21,802 - INFO - Processing document 4_2023-11-27
2025-11-14 16:47:21,829 - INFO - Finished converting document 4_2023-11-27 in 0.06 sec.
2025-11-14 16:47:21,943 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:47:21,944 - ERROR - Input document 4_2023-11-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:47:21,946 - INFO - Going to convert document batch...
2025-11-14 16:47:21,976 - IN

Converted 'data\edgar_documents\HD\4_2023-11-27' --> 'data\processed_data\HD\4_2023-11-27.md'
Error processing data\edgar_documents\HD\4_2023-11-28: File format not allowed: data\edgar_documents\HD\4_2023-11-28
Converted 'data\edgar_documents\HD\4_2023-11-30' --> 'data\processed_data\HD\4_2023-11-30.md'


2025-11-14 16:47:22,059 - INFO - Going to convert document batch...
2025-11-14 16:47:22,059 - INFO - Processing document 4_2024-01-31
2025-11-14 16:47:22,093 - INFO - Finished converting document 4_2024-01-31 in 0.06 sec.
2025-11-14 16:47:22,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,146 - INFO - Going to convert document batch...
2025-11-14 16:47:22,148 - INFO - Processing document 4_2024-02-02
2025-11-14 16:47:22,170 - INFO - Finished converting document 4_2024-02-02 in 0.06 sec.
2025-11-14 16:47:22,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,231 - INFO - Going to convert document batch...
2025-11-14 16:47:22,233 - INFO - Processing document 4_2024-02-23
2025-11-14 16:47:22,262 - INFO - Finished converting document 4_2024-02-23 in 0.08 sec.
2025-11-14 16:47:22,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\4_2024-01-31' --> 'data\processed_data\HD\4_2024-01-31.md'
Converted 'data\edgar_documents\HD\4_2024-02-02' --> 'data\processed_data\HD\4_2024-02-02.md'
Converted 'data\edgar_documents\HD\4_2024-02-23' --> 'data\processed_data\HD\4_2024-02-23.md'


2025-11-14 16:47:22,302 - INFO - Going to convert document batch...
2025-11-14 16:47:22,302 - INFO - Processing document 4_2024-02-26
2025-11-14 16:47:22,326 - INFO - Finished converting document 4_2024-02-26 in 0.05 sec.
2025-11-14 16:47:22,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,379 - INFO - Going to convert document batch...
2025-11-14 16:47:22,380 - INFO - Processing document 4_2024-02-29
2025-11-14 16:47:22,400 - INFO - Finished converting document 4_2024-02-29 in 0.03 sec.
2025-11-14 16:47:22,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,462 - INFO - Going to convert document batch...
2025-11-14 16:47:22,463 - INFO - Processing document 4_2024-03-22
2025-11-14 16:47:22,487 - INFO - Finished converting document 4_2024-03-22 in 0.06 sec.
2025-11-14 16:47:22,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,550 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2024-02-26' --> 'data\processed_data\HD\4_2024-02-26.md'
Converted 'data\edgar_documents\HD\4_2024-02-29' --> 'data\processed_data\HD\4_2024-02-29.md'
Converted 'data\edgar_documents\HD\4_2024-03-22' --> 'data\processed_data\HD\4_2024-03-22.md'


2025-11-14 16:47:22,551 - INFO - Processing document 4_2024-03-29
2025-11-14 16:47:22,578 - INFO - Finished converting document 4_2024-03-29 in 0.06 sec.
2025-11-14 16:47:22,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,745 - INFO - Going to convert document batch...
2025-11-14 16:47:22,746 - INFO - Processing document 4_2024-05-17
2025-11-14 16:47:22,769 - INFO - Finished converting document 4_2024-05-17 in 0.08 sec.
2025-11-14 16:47:22,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,820 - INFO - Going to convert document batch...
2025-11-14 16:47:22,820 - INFO - Processing document 4_2024-05-20
2025-11-14 16:47:22,852 - INFO - Finished converting document 4_2024-05-20 in 0.06 sec.


Converted 'data\edgar_documents\HD\4_2024-03-29' --> 'data\processed_data\HD\4_2024-03-29.md'
Converted 'data\edgar_documents\HD\4_2024-05-17' --> 'data\processed_data\HD\4_2024-05-17.md'


2025-11-14 16:47:22,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:22,912 - INFO - Going to convert document batch...
2025-11-14 16:47:22,913 - INFO - Processing document 4_2024-05-21
2025-11-14 16:47:22,943 - INFO - Finished converting document 4_2024-05-21 in 0.05 sec.
2025-11-14 16:47:22,993 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:47:22,994 - ERROR - Input document 4_2024-06-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:47

Converted 'data\edgar_documents\HD\4_2024-05-20' --> 'data\processed_data\HD\4_2024-05-20.md'
Converted 'data\edgar_documents\HD\4_2024-05-21' --> 'data\processed_data\HD\4_2024-05-21.md'
Error processing data\edgar_documents\HD\4_2024-06-17: File format not allowed: data\edgar_documents\HD\4_2024-06-17
Error processing data\edgar_documents\HD\4_2024-06-18: File format not allowed: data\edgar_documents\HD\4_2024-06-18


2025-11-14 16:47:23,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,121 - INFO - Going to convert document batch...
2025-11-14 16:47:23,122 - INFO - Processing document 4_2024-08-20
2025-11-14 16:47:23,148 - INFO - Finished converting document 4_2024-08-20 in 0.05 sec.
2025-11-14 16:47:23,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,199 - INFO - Going to convert document batch...
2025-11-14 16:47:23,217 - INFO - Processing document 4_2024-09-25
2025-11-14 16:47:23,288 - INFO - Finished converting document 4_2024-09-25 in 0.11 sec.


Converted 'data\edgar_documents\HD\4_2024-08-19' --> 'data\processed_data\HD\4_2024-08-19.md'
Converted 'data\edgar_documents\HD\4_2024-08-20' --> 'data\processed_data\HD\4_2024-08-20.md'


2025-11-14 16:47:23,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,392 - INFO - Going to convert document batch...
2025-11-14 16:47:23,393 - INFO - Processing document 4_2024-11-15
2025-11-14 16:47:23,441 - INFO - Finished converting document 4_2024-11-15 in 0.11 sec.


Converted 'data\edgar_documents\HD\4_2024-09-25' --> 'data\processed_data\HD\4_2024-09-25.md'
Converted 'data\edgar_documents\HD\4_2024-11-15' --> 'data\processed_data\HD\4_2024-11-15.md'


2025-11-14 16:47:23,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,544 - INFO - Going to convert document batch...
2025-11-14 16:47:23,545 - INFO - Processing document 4_2024-11-20
2025-11-14 16:47:23,578 - INFO - Finished converting document 4_2024-11-20 in 0.11 sec.
2025-11-14 16:47:23,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,672 - INFO - Going to convert document batch...
2025-11-14 16:47:23,674 - INFO - Processing document 4_2024-11-22
2025-11-14 16:47:23,709 - INFO - Finished converting document 4_2024-11-22 in 0.09 sec.
2025-11-14 16:47:23,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\4_2024-11-20' --> 'data\processed_data\HD\4_2024-11-20.md'
Converted 'data\edgar_documents\HD\4_2024-11-22' --> 'data\processed_data\HD\4_2024-11-22.md'


2025-11-14 16:47:23,810 - INFO - Going to convert document batch...
2025-11-14 16:47:23,811 - INFO - Processing document 4_2024-11-25
2025-11-14 16:47:23,854 - INFO - Finished converting document 4_2024-11-25 in 0.12 sec.
2025-11-14 16:47:23,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:23,958 - INFO - Going to convert document batch...
2025-11-14 16:47:23,960 - INFO - Processing document 4_2024-12-02
2025-11-14 16:47:23,993 - INFO - Finished converting document 4_2024-12-02 in 0.09 sec.
2025-11-14 16:47:24,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,052 - INFO - Going to convert document batch...
2025-11-14 16:47:24,052 - INFO - Processing document 4_2025-02-04
2025-11-14 16:47:24,083 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.


Converted 'data\edgar_documents\HD\4_2024-11-25' --> 'data\processed_data\HD\4_2024-11-25.md'
Converted 'data\edgar_documents\HD\4_2024-12-02' --> 'data\processed_data\HD\4_2024-12-02.md'


2025-11-14 16:47:24,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,130 - INFO - Going to convert document batch...
2025-11-14 16:47:24,131 - INFO - Processing document 4_2025-02-20
2025-11-14 16:47:24,153 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 16:47:24,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,202 - INFO - Going to convert document batch...
2025-11-14 16:47:24,203 - INFO - Processing document 4_2025-02-28
2025-11-14 16:47:24,231 - INFO - Finished converting document 4_2025-02-28 in 0.06 sec.
2025-11-14 16:47:24,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,276 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2025-02-04' --> 'data\processed_data\HD\4_2025-02-04.md'
Converted 'data\edgar_documents\HD\4_2025-02-20' --> 'data\processed_data\HD\4_2025-02-20.md'
Converted 'data\edgar_documents\HD\4_2025-02-28' --> 'data\processed_data\HD\4_2025-02-28.md'


2025-11-14 16:47:24,277 - INFO - Processing document 4_2025-03-03
2025-11-14 16:47:24,304 - INFO - Finished converting document 4_2025-03-03 in 0.05 sec.
2025-11-14 16:47:24,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,369 - INFO - Going to convert document batch...
2025-11-14 16:47:24,370 - INFO - Processing document 4_2025-03-17
2025-11-14 16:47:24,395 - INFO - Finished converting document 4_2025-03-17 in 0.05 sec.
2025-11-14 16:47:24,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,441 - INFO - Going to convert document batch...
2025-11-14 16:47:24,442 - INFO - Processing document 4_2025-03-18
2025-11-14 16:47:24,466 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 16:47:24,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,529 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2025-03-03' --> 'data\processed_data\HD\4_2025-03-03.md'
Converted 'data\edgar_documents\HD\4_2025-03-17' --> 'data\processed_data\HD\4_2025-03-17.md'
Converted 'data\edgar_documents\HD\4_2025-03-18' --> 'data\processed_data\HD\4_2025-03-18.md'


2025-11-14 16:47:24,530 - INFO - Processing document 4_2025-03-25
2025-11-14 16:47:24,553 - INFO - Finished converting document 4_2025-03-25 in 0.06 sec.
2025-11-14 16:47:24,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,609 - INFO - Going to convert document batch...
2025-11-14 16:47:24,610 - INFO - Processing document 4_2025-03-27
2025-11-14 16:47:24,637 - INFO - Finished converting document 4_2025-03-27 in 0.06 sec.
2025-11-14 16:47:24,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,686 - INFO - Going to convert document batch...
2025-11-14 16:47:24,686 - INFO - Processing document 4_2025-04-14
2025-11-14 16:47:24,711 - INFO - Finished converting document 4_2025-04-14 in 0.05 sec.
2025-11-14 16:47:24,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,773 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2025-03-25' --> 'data\processed_data\HD\4_2025-03-25.md'
Converted 'data\edgar_documents\HD\4_2025-03-27' --> 'data\processed_data\HD\4_2025-03-27.md'
Converted 'data\edgar_documents\HD\4_2025-04-14' --> 'data\processed_data\HD\4_2025-04-14.md'


2025-11-14 16:47:24,775 - INFO - Processing document 4_2025-05-23
2025-11-14 16:47:24,812 - INFO - Finished converting document 4_2025-05-23 in 0.08 sec.
2025-11-14 16:47:24,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,911 - INFO - Going to convert document batch...
2025-11-14 16:47:24,912 - INFO - Processing document 4_2025-05-27
2025-11-14 16:47:24,935 - INFO - Finished converting document 4_2025-05-27 in 0.09 sec.
2025-11-14 16:47:24,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:24,987 - INFO - Going to convert document batch...
2025-11-14 16:47:24,987 - INFO - Processing document 4_2025-05-29
2025-11-14 16:47:25,018 - INFO - Finished converting document 4_2025-05-29 in 0.06 sec.


Converted 'data\edgar_documents\HD\4_2025-05-23' --> 'data\processed_data\HD\4_2025-05-23.md'
Converted 'data\edgar_documents\HD\4_2025-05-27' --> 'data\processed_data\HD\4_2025-05-27.md'
Converted 'data\edgar_documents\HD\4_2025-05-29' --> 'data\processed_data\HD\4_2025-05-29.md'


2025-11-14 16:47:25,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,067 - INFO - Going to convert document batch...
2025-11-14 16:47:25,068 - INFO - Processing document 4_2025-06-04
2025-11-14 16:47:25,101 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 16:47:25,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,148 - INFO - Going to convert document batch...
2025-11-14 16:47:25,149 - INFO - Processing document 4_2025-08-19
2025-11-14 16:47:25,170 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 16:47:25,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,234 - INFO - Going to convert document batch...
2025-11-14 16:47:25,235 - INFO - Processing document 4_2025-08-22
2025-11-14 16:47:25,261 - INFO - Finished converting document 4_2025-08-22 in 0.08 sec.
2025-11-14 16:47:25,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\HD\4_2025-06-04' --> 'data\processed_data\HD\4_2025-06-04.md'
Converted 'data\edgar_documents\HD\4_2025-08-19' --> 'data\processed_data\HD\4_2025-08-19.md'
Converted 'data\edgar_documents\HD\4_2025-08-22' --> 'data\processed_data\HD\4_2025-08-22.md'


2025-11-14 16:47:25,377 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:47:25,378 - ERROR - Input document 4_2025-09-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:47:25,379 - INFO - Going to convert document batch...
2025-11-14 16:47:25,401 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:47:25,402 - ERROR - Input document 4_2025-09-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\HD\4_2025-08-25' --> 'data\processed_data\HD\4_2025-08-25.md'
Error processing data\edgar_documents\HD\4_2025-09-08: File format not allowed: data\edgar_documents\HD\4_2025-09-08
Error processing data\edgar_documents\HD\4_2025-09-10: File format not allowed: data\edgar_documents\HD\4_2025-09-10
Converted 'data\edgar_documents\HD\4_2025-09-15' --> 'data\processed_data\HD\4_2025-09-15.md'


2025-11-14 16:47:25,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,585 - INFO - Going to convert document batch...
2025-11-14 16:47:25,586 - INFO - Processing document 8-K_2023-02-21
2025-11-14 16:47:25,618 - INFO - Finished converting document 8-K_2023-02-21 in 0.06 sec.
2025-11-14 16:47:25,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,734 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\4_2025-09-24' --> 'data\processed_data\HD\4_2025-09-24.md'
Converted 'data\edgar_documents\HD\8-K_2023-02-21' --> 'data\processed_data\HD\8-K_2023-02-21.md'


2025-11-14 16:47:25,734 - INFO - Processing document 8-K_2023-02-28
2025-11-14 16:47:25,758 - INFO - Finished converting document 8-K_2023-02-28 in 0.08 sec.
2025-11-14 16:47:25,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,798 - INFO - Going to convert document batch...
2025-11-14 16:47:25,799 - INFO - Processing document 8-K_2023-04-19
2025-11-14 16:47:25,816 - INFO - Finished converting document 8-K_2023-04-19 in 0.05 sec.
2025-11-14 16:47:25,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,864 - INFO - Going to convert document batch...
2025-11-14 16:47:25,864 - INFO - Processing document 8-K_2023-05-16
2025-11-14 16:47:25,882 - INFO - Finished converting document 8-K_2023-05-16 in 0.05 sec.
2025-11-14 16:47:25,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:25,952 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\8-K_2023-02-28' --> 'data\processed_data\HD\8-K_2023-02-28.md'
Converted 'data\edgar_documents\HD\8-K_2023-04-19' --> 'data\processed_data\HD\8-K_2023-04-19.md'
Converted 'data\edgar_documents\HD\8-K_2023-05-16' --> 'data\processed_data\HD\8-K_2023-05-16.md'


2025-11-14 16:47:25,953 - INFO - Processing document 8-K_2023-05-23
2025-11-14 16:47:26,007 - INFO - Finished converting document 8-K_2023-05-23 in 0.11 sec.
2025-11-14 16:47:26,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,099 - INFO - Going to convert document batch...
2025-11-14 16:47:26,100 - INFO - Processing document 8-K_2023-06-20
2025-11-14 16:47:26,116 - INFO - Finished converting document 8-K_2023-06-20 in 0.06 sec.
2025-11-14 16:47:26,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,148 - INFO - Going to convert document batch...
2025-11-14 16:47:26,149 - INFO - Processing document 8-K_2023-07-13
2025-11-14 16:47:26,163 - INFO - Finished converting document 8-K_2023-07-13 in 0.03 sec.
2025-11-14 16:47:26,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,203 - INFO - Going to convert document batch...
2025-11-14 16:47:26,204 - INFO - Processing document 8-K_2023-08-15
2025-11-14 16:

Converted 'data\edgar_documents\HD\8-K_2023-05-23' --> 'data\processed_data\HD\8-K_2023-05-23.md'
Converted 'data\edgar_documents\HD\8-K_2023-06-20' --> 'data\processed_data\HD\8-K_2023-06-20.md'
Converted 'data\edgar_documents\HD\8-K_2023-07-13' --> 'data\processed_data\HD\8-K_2023-07-13.md'


2025-11-14 16:47:26,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,263 - INFO - Going to convert document batch...
2025-11-14 16:47:26,263 - INFO - Processing document 8-K_2023-10-30
2025-11-14 16:47:26,283 - INFO - Finished converting document 8-K_2023-10-30 in 0.05 sec.
2025-11-14 16:47:26,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,400 - INFO - Going to convert document batch...
2025-11-14 16:47:26,401 - INFO - Processing document 8-K_2023-11-14
2025-11-14 16:47:26,428 - INFO - Finished converting document 8-K_2023-11-14 in 0.12 sec.


Converted 'data\edgar_documents\HD\8-K_2023-08-15' --> 'data\processed_data\HD\8-K_2023-08-15.md'
Converted 'data\edgar_documents\HD\8-K_2023-10-30' --> 'data\processed_data\HD\8-K_2023-10-30.md'


2025-11-14 16:47:26,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,485 - INFO - Going to convert document batch...
2025-11-14 16:47:26,486 - INFO - Processing document 8-K_2023-11-28
2025-11-14 16:47:26,505 - INFO - Finished converting document 8-K_2023-11-28 in 0.06 sec.
2025-11-14 16:47:26,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:26,550 - INFO - Going to convert document batch...
2025-11-14 16:47:26,551 - INFO - Processing document 8-K_2023-12-05


Converted 'data\edgar_documents\HD\8-K_2023-11-14' --> 'data\processed_data\HD\8-K_2023-11-14.md'
Converted 'data\edgar_documents\HD\8-K_2023-11-28' --> 'data\processed_data\HD\8-K_2023-11-28.md'


2025-11-14 16:47:26,957 - INFO - Finished converting document 8-K_2023-12-05 in 0.44 sec.
2025-11-14 16:47:26,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,095 - INFO - Going to convert document batch...
2025-11-14 16:47:27,096 - INFO - Processing document 8-K_2024-01-10
2025-11-14 16:47:27,122 - INFO - Finished converting document 8-K_2024-01-10 in 0.16 sec.
2025-11-14 16:47:27,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,154 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\8-K_2023-12-05' --> 'data\processed_data\HD\8-K_2023-12-05.md'
Converted 'data\edgar_documents\HD\8-K_2024-01-10' --> 'data\processed_data\HD\8-K_2024-01-10.md'


2025-11-14 16:47:27,155 - INFO - Processing document 8-K_2024-02-20
2025-11-14 16:47:27,173 - INFO - Finished converting document 8-K_2024-02-20 in 0.05 sec.
2025-11-14 16:47:27,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,215 - INFO - Going to convert document batch...
2025-11-14 16:47:27,216 - INFO - Processing document 8-K_2024-03-28
2025-11-14 16:47:27,250 - INFO - Finished converting document 8-K_2024-03-28 in 0.06 sec.
2025-11-14 16:47:27,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,312 - INFO - Going to convert document batch...
2025-11-14 16:47:27,313 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:47:27,329 - INFO - Finished converting document 8-K_2024-05-09 in 0.06 sec.
2025-11-14 16:47:27,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,362 - INFO - Going to convert document batch...
2025-11-14 16:47:27,362 - INFO - Processing document 8-K_2024-05-14
2025-11-14 16:

Converted 'data\edgar_documents\HD\8-K_2024-02-20' --> 'data\processed_data\HD\8-K_2024-02-20.md'
Converted 'data\edgar_documents\HD\8-K_2024-03-28' --> 'data\processed_data\HD\8-K_2024-03-28.md'
Converted 'data\edgar_documents\HD\8-K_2024-05-09' --> 'data\processed_data\HD\8-K_2024-05-09.md'


2025-11-14 16:47:27,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,433 - INFO - Going to convert document batch...
2025-11-14 16:47:27,434 - INFO - Processing document 8-K_2024-05-22
2025-11-14 16:47:27,563 - INFO - Finished converting document 8-K_2024-05-22 in 0.17 sec.


Converted 'data\edgar_documents\HD\8-K_2024-05-14' --> 'data\processed_data\HD\8-K_2024-05-14.md'
Converted 'data\edgar_documents\HD\8-K_2024-05-22' --> 'data\processed_data\HD\8-K_2024-05-22.md'


2025-11-14 16:47:27,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,666 - INFO - Going to convert document batch...
2025-11-14 16:47:27,667 - INFO - Processing document 8-K_2024-05-30
2025-11-14 16:47:27,686 - INFO - Finished converting document 8-K_2024-05-30 in 0.09 sec.
2025-11-14 16:47:27,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,732 - INFO - Going to convert document batch...
2025-11-14 16:47:27,732 - INFO - Processing document 8-K_2024-06-18
2025-11-14 16:47:27,754 - INFO - Finished converting document 8-K_2024-06-18 in 0.06 sec.
2025-11-14 16:47:27,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,796 - INFO - Going to convert document batch...
2025-11-14 16:47:27,797 - INFO - Processing document 8-K_2024-06-25
2025-11-14 16:47:27,830 - INFO - Finished converting document 8-K_2024-06-25 in 0.06 sec.
2025-11-14 16:47:27,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\HD\8-K_2024-05-30' --> 'data\processed_data\HD\8-K_2024-05-30.md'
Converted 'data\edgar_documents\HD\8-K_2024-06-18' --> 'data\processed_data\HD\8-K_2024-06-18.md'
Converted 'data\edgar_documents\HD\8-K_2024-06-25' --> 'data\processed_data\HD\8-K_2024-06-25.md'


2025-11-14 16:47:27,877 - INFO - Processing document 8-K_2024-06-27
2025-11-14 16:47:27,895 - INFO - Finished converting document 8-K_2024-06-27 in 0.05 sec.
2025-11-14 16:47:27,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:27,935 - INFO - Going to convert document batch...
2025-11-14 16:47:27,936 - INFO - Processing document 8-K_2024-08-13
2025-11-14 16:47:28,002 - INFO - Finished converting document 8-K_2024-08-13 in 0.09 sec.


Converted 'data\edgar_documents\HD\8-K_2024-06-27' --> 'data\processed_data\HD\8-K_2024-06-27.md'
Converted 'data\edgar_documents\HD\8-K_2024-08-13' --> 'data\processed_data\HD\8-K_2024-08-13.md'


2025-11-14 16:47:28,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,131 - INFO - Going to convert document batch...
2025-11-14 16:47:28,132 - INFO - Processing document 8-K_2024-11-12
2025-11-14 16:47:28,151 - INFO - Finished converting document 8-K_2024-11-12 in 0.11 sec.
2025-11-14 16:47:28,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,194 - INFO - Going to convert document batch...
2025-11-14 16:47:28,196 - INFO - Processing document 8-K_2024-12-19
2025-11-14 16:47:28,211 - INFO - Finished converting document 8-K_2024-12-19 in 0.03 sec.
2025-11-14 16:47:28,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,242 - INFO - Going to convert document batch...
2025-11-14 16:47:28,242 - INFO - Processing document 8-K_2025-02-25
2025-11-14 16:47:28,268 - INFO - Finished converting document 8-K_2025-02-25 in 0.05 sec.
2025-11-14 16:47:28,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\HD\8-K_2024-11-12' --> 'data\processed_data\HD\8-K_2024-11-12.md'
Converted 'data\edgar_documents\HD\8-K_2024-12-19' --> 'data\processed_data\HD\8-K_2024-12-19.md'
Converted 'data\edgar_documents\HD\8-K_2025-02-25' --> 'data\processed_data\HD\8-K_2025-02-25.md'
Converted 'data\edgar_documents\HD\8-K_2025-05-06' --> 'data\processed_data\HD\8-K_2025-05-06.md'


2025-11-14 16:47:28,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,521 - INFO - Going to convert document batch...
2025-11-14 16:47:28,523 - INFO - Processing document 8-K_2025-05-28
2025-11-14 16:47:28,561 - INFO - Finished converting document 8-K_2025-05-28 in 0.19 sec.


Converted 'data\edgar_documents\HD\8-K_2025-05-20' --> 'data\processed_data\HD\8-K_2025-05-20.md'


2025-11-14 16:47:28,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,612 - INFO - Going to convert document batch...
2025-11-14 16:47:28,613 - INFO - Processing document 8-K_2025-08-19
2025-11-14 16:47:28,635 - INFO - Finished converting document 8-K_2025-08-19 in 0.06 sec.
2025-11-14 16:47:28,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,764 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HD\8-K_2025-05-28' --> 'data\processed_data\HD\8-K_2025-05-28.md'
Converted 'data\edgar_documents\HD\8-K_2025-08-19' --> 'data\processed_data\HD\8-K_2025-08-19.md'


2025-11-14 16:47:28,766 - INFO - Processing document 8-K_2025-09-10
2025-11-14 16:47:28,793 - INFO - Finished converting document 8-K_2025-09-10 in 0.16 sec.
2025-11-14 16:47:28,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:28,875 - INFO - Going to convert document batch...
2025-11-14 16:47:28,877 - INFO - Processing document 8-K_2025-09-15
2025-11-14 16:47:28,942 - INFO - Finished converting document 8-K_2025-09-15 in 0.12 sec.


Converted 'data\edgar_documents\HD\8-K_2025-09-10' --> 'data\processed_data\HD\8-K_2025-09-10.md'
Converted 'data\edgar_documents\HD\8-K_2025-09-15' --> 'data\processed_data\HD\8-K_2025-09-15.md'


2025-11-14 16:47:29,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:29,527 - INFO - Going to convert document batch...
2025-11-14 16:47:29,527 - INFO - Processing document DEF-14A_2023-04-03
2025-11-14 16:47:31,400 - INFO - Finished converting document DEF-14A_2023-04-03 in 2.42 sec.
2025-11-14 16:47:32,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\DEF-14A_2023-04-03' --> 'data\processed_data\HD\DEF-14A_2023-04-03.md'


2025-11-14 16:47:32,669 - INFO - Going to convert document batch...
2025-11-14 16:47:32,671 - INFO - Processing document DEF-14A_2024-04-01
2025-11-14 16:47:34,339 - INFO - Finished converting document DEF-14A_2024-04-01 in 2.20 sec.
2025-11-14 16:47:35,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HD\DEF-14A_2024-04-01' --> 'data\processed_data\HD\DEF-14A_2024-04-01.md'


2025-11-14 16:47:35,793 - INFO - Going to convert document batch...
2025-11-14 16:47:35,794 - INFO - Processing document DEF-14A_2025-04-07
2025-11-14 16:47:37,321 - INFO - Finished converting document DEF-14A_2025-04-07 in 2.28 sec.


Converted 'data\edgar_documents\HD\DEF-14A_2025-04-07' --> 'data\processed_data\HD\DEF-14A_2025-04-07.md'
Processed 99 new files. Errors: 5
Found 158 files to process in data\edgar_documents\HON


2025-11-14 16:47:38,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:47:40,129 - INFO - Going to convert document batch...
2025-11-14 16:47:40,130 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:47:40,131 - INFO - Processing document 10-K_2023-02-10
2025-11-14 16:47:44,658 - INFO - Finished converting document 10-K_2023-02-10 in 6.59 sec.
2025-11-14 16:47:46,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-K_2023-02-10' --> 'data\processed_data\HON\10-K_2023-02-10.md'


2025-11-14 16:47:47,908 - INFO - Going to convert document batch...
2025-11-14 16:47:47,909 - INFO - Processing document 10-K_2024-02-16
2025-11-14 16:47:52,333 - INFO - Finished converting document 10-K_2024-02-16 in 6.11 sec.
2025-11-14 16:47:53,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-K_2024-02-16' --> 'data\processed_data\HON\10-K_2024-02-16.md'


2025-11-14 16:47:55,740 - INFO - Going to convert document batch...
2025-11-14 16:47:55,741 - INFO - Processing document 10-K_2025-02-14
2025-11-14 16:48:00,407 - INFO - Finished converting document 10-K_2025-02-14 in 6.75 sec.
2025-11-14 16:48:02,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-K_2025-02-14' --> 'data\processed_data\HON\10-K_2025-02-14.md'


2025-11-14 16:48:02,730 - INFO - Going to convert document batch...
2025-11-14 16:48:02,731 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 16:48:03,738 - INFO - Finished converting document 10-Q_2023-04-27 in 1.64 sec.
2025-11-14 16:48:05,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2023-04-27' --> 'data\processed_data\HON\10-Q_2023-04-27.md'


2025-11-14 16:48:05,711 - INFO - Going to convert document batch...
2025-11-14 16:48:05,711 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 16:48:07,236 - INFO - Finished converting document 10-Q_2023-07-27 in 2.30 sec.
2025-11-14 16:48:07,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2023-07-27' --> 'data\processed_data\HON\10-Q_2023-07-27.md'


2025-11-14 16:48:08,835 - INFO - Going to convert document batch...
2025-11-14 16:48:08,836 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 16:48:09,963 - INFO - Finished converting document 10-Q_2023-10-26 in 2.16 sec.
2025-11-14 16:48:10,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2023-10-26' --> 'data\processed_data\HON\10-Q_2023-10-26.md'


2025-11-14 16:48:11,697 - INFO - Going to convert document batch...
2025-11-14 16:48:11,697 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 16:48:12,612 - INFO - Finished converting document 10-Q_2024-04-25 in 1.91 sec.
2025-11-14 16:48:13,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2024-04-25' --> 'data\processed_data\HON\10-Q_2024-04-25.md'


2025-11-14 16:48:13,750 - INFO - Going to convert document batch...
2025-11-14 16:48:13,750 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 16:48:14,919 - INFO - Finished converting document 10-Q_2024-07-25 in 1.84 sec.
2025-11-14 16:48:15,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2024-07-25' --> 'data\processed_data\HON\10-Q_2024-07-25.md'


2025-11-14 16:48:16,898 - INFO - Going to convert document batch...
2025-11-14 16:48:16,899 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 16:48:18,410 - INFO - Finished converting document 10-Q_2024-10-24 in 2.78 sec.
2025-11-14 16:48:19,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2024-10-24' --> 'data\processed_data\HON\10-Q_2024-10-24.md'


2025-11-14 16:48:19,899 - INFO - Going to convert document batch...
2025-11-14 16:48:19,901 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 16:48:20,859 - INFO - Finished converting document 10-Q_2025-04-29 in 1.83 sec.
2025-11-14 16:48:21,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2025-04-29' --> 'data\processed_data\HON\10-Q_2025-04-29.md'


2025-11-14 16:48:22,207 - INFO - Going to convert document batch...
2025-11-14 16:48:22,207 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:48:24,162 - INFO - Finished converting document 10-Q_2025-07-24 in 2.77 sec.
2025-11-14 16:48:24,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\10-Q_2025-07-24' --> 'data\processed_data\HON\10-Q_2025-07-24.md'


2025-11-14 16:48:25,423 - INFO - Going to convert document batch...
2025-11-14 16:48:25,424 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 16:48:26,886 - INFO - Finished converting document 10-Q_2025-10-23 in 2.16 sec.
2025-11-14 16:48:27,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:27,696 - INFO - Going to convert document batch...
2025-11-14 16:48:27,697 - INFO - Processing document 4_2023-01-05
2025-11-14 16:48:27,725 - INFO - Finished converting document 4_2023-01-05 in 0.08 sec.
2025-11-14 16:48:27,769 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:27,770 - ERROR - Input document 4_2023-01-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\HON\10-Q_2025-10-23' --> 'data\processed_data\HON\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\HON\4_2023-01-05' --> 'data\processed_data\HON\4_2023-01-05.md'
Error processing data\edgar_documents\HON\4_2023-01-31: File format not allowed: data\edgar_documents\HON\4_2023-01-31


2025-11-14 16:48:28,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,368 - INFO - Going to convert document batch...
2025-11-14 16:48:28,369 - INFO - Processing document 4_2023-02-16
2025-11-14 16:48:28,398 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 16:48:28,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,462 - INFO - Going to convert document batch...
2025-11-14 16:48:28,462 - INFO - Processing document 4_2023-02-28
2025-11-14 16:48:28,494 - INFO - Finished converting document 4_2023-02-28 in 0.06 sec.
2025-11-14 16:48:28,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2023-02-14' --> 'data\processed_data\HON\4_2023-02-14.md'
Converted 'data\edgar_documents\HON\4_2023-02-16' --> 'data\processed_data\HON\4_2023-02-16.md'
Converted 'data\edgar_documents\HON\4_2023-02-28' --> 'data\processed_data\HON\4_2023-02-28.md'


2025-11-14 16:48:28,541 - INFO - Going to convert document batch...
2025-11-14 16:48:28,542 - INFO - Processing document 4_2023-04-04
2025-11-14 16:48:28,560 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 16:48:28,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,718 - INFO - Going to convert document batch...
2025-11-14 16:48:28,719 - INFO - Processing document 4_2023-04-05
2025-11-14 16:48:28,742 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 16:48:28,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,796 - INFO - Going to convert document batch...
2025-11-14 16:48:28,797 - INFO - Processing document 4_2023-04-18
2025-11-14 16:48:28,823 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\HON\4_2023-04-04' --> 'data\processed_data\HON\4_2023-04-04.md'
Converted 'data\edgar_documents\HON\4_2023-04-05' --> 'data\processed_data\HON\4_2023-04-05.md'
Converted 'data\edgar_documents\HON\4_2023-04-18' --> 'data\processed_data\HON\4_2023-04-18.md'


2025-11-14 16:48:28,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,890 - INFO - Going to convert document batch...
2025-11-14 16:48:28,891 - INFO - Processing document 4_2023-04-26
2025-11-14 16:48:28,921 - INFO - Finished converting document 4_2023-04-26 in 0.08 sec.
2025-11-14 16:48:28,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:28,979 - INFO - Going to convert document batch...
2025-11-14 16:48:28,979 - INFO - Processing document 4_2023-05-05
2025-11-14 16:48:29,008 - INFO - Finished converting document 4_2023-05-05 in 0.05 sec.
2025-11-14 16:48:29,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:29,082 - INFO - Going to convert document batch...
2025-11-14 16:48:29,083 - INFO - Processing document 4_2023-05-10
2025-11-14 16:48:29,127 - INFO - Finished converting document 4_2023-05-10 in 0.09 sec.


Converted 'data\edgar_documents\HON\4_2023-04-26' --> 'data\processed_data\HON\4_2023-04-26.md'
Converted 'data\edgar_documents\HON\4_2023-05-05' --> 'data\processed_data\HON\4_2023-05-05.md'


2025-11-14 16:48:29,220 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:29,221 - ERROR - Input document 4_2023-05-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:48:29,223 - INFO - Going to convert document batch...
2025-11-14 16:48:29,243 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:29,244 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\HON\4_2023-05-10' --> 'data\processed_data\HON\4_2023-05-10.md'
Error processing data\edgar_documents\HON\4_2023-05-12: File format not allowed: data\edgar_documents\HON\4_2023-05-12
Error processing data\edgar_documents\HON\4_2023-05-15: File format not allowed: data\edgar_documents\HON\4_2023-05-15
Converted 'data\edgar_documents\HON\4_2023-05-23' --> 'data\processed_data\HON\4_2023-05-23.md'


2025-11-14 16:48:29,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:29,373 - INFO - Going to convert document batch...
2025-11-14 16:48:29,378 - INFO - Processing document 4_2023-06-05
2025-11-14 16:48:29,507 - INFO - Finished converting document 4_2023-06-05 in 0.17 sec.
2025-11-14 16:48:29,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:29,613 - INFO - Going to convert document batch...
2025-11-14 16:48:29,615 - INFO - Processing document 4_2023-06-14
2025-11-14 16:48:29,650 - INFO - Finished converting document 4_2023-06-14 in 0.09 sec.
2025-11-14 16:48:29,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2023-06-05' --> 'data\processed_data\HON\4_2023-06-05.md'
Converted 'data\edgar_documents\HON\4_2023-06-14' --> 'data\processed_data\HON\4_2023-06-14.md'


2025-11-14 16:48:29,764 - INFO - Going to convert document batch...
2025-11-14 16:48:29,765 - INFO - Processing document 4_2023-07-06
2025-11-14 16:48:29,795 - INFO - Finished converting document 4_2023-07-06 in 0.11 sec.
2025-11-14 16:48:29,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:29,848 - INFO - Going to convert document batch...
2025-11-14 16:48:29,849 - INFO - Processing document 4_2023-07-27
2025-11-14 16:48:29,874 - INFO - Finished converting document 4_2023-07-27 in 0.05 sec.
2025-11-14 16:48:29,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:29,923 - INFO - Going to convert document batch...
2025-11-14 16:48:29,923 - INFO - Processing document 4_2023-07-31
2025-11-14 16:48:29,949 - INFO - Finished converting document 4_2023-07-31 in 0.06 sec.
2025-11-14 16:48:29,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,010 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\4_2023-07-06' --> 'data\processed_data\HON\4_2023-07-06.md'
Converted 'data\edgar_documents\HON\4_2023-07-27' --> 'data\processed_data\HON\4_2023-07-27.md'
Converted 'data\edgar_documents\HON\4_2023-07-31' --> 'data\processed_data\HON\4_2023-07-31.md'


2025-11-14 16:48:30,011 - INFO - Processing document 4_2023-08-01
2025-11-14 16:48:30,047 - INFO - Finished converting document 4_2023-08-01 in 0.08 sec.
2025-11-14 16:48:30,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,125 - INFO - Going to convert document batch...
2025-11-14 16:48:30,125 - INFO - Processing document 4_2023-08-02
2025-11-14 16:48:30,152 - INFO - Finished converting document 4_2023-08-02 in 0.06 sec.
2025-11-14 16:48:30,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,207 - INFO - Going to convert document batch...
2025-11-14 16:48:30,207 - INFO - Processing document 4_2023-08-03
2025-11-14 16:48:30,239 - INFO - Finished converting document 4_2023-08-03 in 0.06 sec.
2025-11-14 16:48:30,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,282 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\4_2023-08-01' --> 'data\processed_data\HON\4_2023-08-01.md'
Converted 'data\edgar_documents\HON\4_2023-08-02' --> 'data\processed_data\HON\4_2023-08-02.md'
Converted 'data\edgar_documents\HON\4_2023-08-03' --> 'data\processed_data\HON\4_2023-08-03.md'


2025-11-14 16:48:30,283 - INFO - Processing document 4_2023-08-30
2025-11-14 16:48:30,316 - INFO - Finished converting document 4_2023-08-30 in 0.05 sec.
2025-11-14 16:48:30,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,368 - INFO - Going to convert document batch...
2025-11-14 16:48:30,369 - INFO - Processing document 4_2023-10-04
2025-11-14 16:48:30,390 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 16:48:30,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,437 - INFO - Going to convert document batch...
2025-11-14 16:48:30,438 - INFO - Processing document 4_2023-10-05
2025-11-14 16:48:30,463 - INFO - Finished converting document 4_2023-10-05 in 0.06 sec.
2025-11-14 16:48:30,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,518 - INFO - Going to convert document batch...
2025-11-14 16:48:30,519 - INFO - Processing document 4_2023-11-03


Converted 'data\edgar_documents\HON\4_2023-08-30' --> 'data\processed_data\HON\4_2023-08-30.md'
Converted 'data\edgar_documents\HON\4_2023-10-04' --> 'data\processed_data\HON\4_2023-10-04.md'
Converted 'data\edgar_documents\HON\4_2023-10-05' --> 'data\processed_data\HON\4_2023-10-05.md'


2025-11-14 16:48:30,535 - INFO - Finished converting document 4_2023-11-03 in 0.05 sec.
2025-11-14 16:48:30,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,668 - INFO - Going to convert document batch...
2025-11-14 16:48:30,669 - INFO - Processing document 4_2023-11-07
2025-11-14 16:48:30,723 - INFO - Finished converting document 4_2023-11-07 in 0.16 sec.


Converted 'data\edgar_documents\HON\4_2023-11-03' --> 'data\processed_data\HON\4_2023-11-03.md'


2025-11-14 16:48:30,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,815 - INFO - Going to convert document batch...
2025-11-14 16:48:30,816 - INFO - Processing document 4_2023-11-13
2025-11-14 16:48:30,844 - INFO - Finished converting document 4_2023-11-13 in 0.06 sec.
2025-11-14 16:48:30,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:30,922 - INFO - Going to convert document batch...
2025-11-14 16:48:30,937 - INFO - Processing document 4_2023-11-16


Converted 'data\edgar_documents\HON\4_2023-11-07' --> 'data\processed_data\HON\4_2023-11-07.md'
Converted 'data\edgar_documents\HON\4_2023-11-13' --> 'data\processed_data\HON\4_2023-11-13.md'


2025-11-14 16:48:31,013 - INFO - Finished converting document 4_2023-11-16 in 0.14 sec.
2025-11-14 16:48:31,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,094 - INFO - Going to convert document batch...
2025-11-14 16:48:31,095 - INFO - Processing document 4_2023-11-20
2025-11-14 16:48:31,119 - INFO - Finished converting document 4_2023-11-20 in 0.08 sec.
2025-11-14 16:48:31,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,175 - INFO - Going to convert document batch...
2025-11-14 16:48:31,176 - INFO - Processing document 4_2023-11-27
2025-11-14 16:48:31,210 - INFO - Finished converting document 4_2023-11-27 in 0.06 sec.


Converted 'data\edgar_documents\HON\4_2023-11-16' --> 'data\processed_data\HON\4_2023-11-16.md'
Converted 'data\edgar_documents\HON\4_2023-11-20' --> 'data\processed_data\HON\4_2023-11-20.md'


2025-11-14 16:48:31,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,259 - INFO - Going to convert document batch...
2025-11-14 16:48:31,259 - INFO - Processing document 4_2024-01-04
2025-11-14 16:48:31,294 - INFO - Finished converting document 4_2024-01-04 in 0.06 sec.
2025-11-14 16:48:31,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,341 - INFO - Going to convert document batch...
2025-11-14 16:48:31,342 - INFO - Processing document 4_2024-02-07
2025-11-14 16:48:31,363 - INFO - Finished converting document 4_2024-02-07 in 0.05 sec.
2025-11-14 16:48:31,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,411 - INFO - Going to convert document batch...
2025-11-14 16:48:31,412 - INFO - Processing document 4_2024-02-13


Converted 'data\edgar_documents\HON\4_2023-11-27' --> 'data\processed_data\HON\4_2023-11-27.md'
Converted 'data\edgar_documents\HON\4_2024-01-04' --> 'data\processed_data\HON\4_2024-01-04.md'
Converted 'data\edgar_documents\HON\4_2024-02-07' --> 'data\processed_data\HON\4_2024-02-07.md'


2025-11-14 16:48:31,438 - INFO - Finished converting document 4_2024-02-13 in 0.05 sec.
2025-11-14 16:48:31,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,501 - INFO - Going to convert document batch...
2025-11-14 16:48:31,502 - INFO - Processing document 4_2024-02-14
2025-11-14 16:48:31,530 - INFO - Finished converting document 4_2024-02-14 in 0.06 sec.
2025-11-14 16:48:31,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,601 - INFO - Going to convert document batch...
2025-11-14 16:48:31,601 - INFO - Processing document 4_2024-02-16
2025-11-14 16:48:31,627 - INFO - Finished converting document 4_2024-02-16 in 0.06 sec.
2025-11-14 16:48:31,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2024-02-13' --> 'data\processed_data\HON\4_2024-02-13.md'
Converted 'data\edgar_documents\HON\4_2024-02-14' --> 'data\processed_data\HON\4_2024-02-14.md'
Converted 'data\edgar_documents\HON\4_2024-02-16' --> 'data\processed_data\HON\4_2024-02-16.md'


2025-11-14 16:48:31,676 - INFO - Going to convert document batch...
2025-11-14 16:48:31,677 - INFO - Processing document 4_2024-02-20
2025-11-14 16:48:31,702 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 16:48:31,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,761 - INFO - Going to convert document batch...
2025-11-14 16:48:31,762 - INFO - Processing document 4_2024-02-21
2025-11-14 16:48:31,787 - INFO - Finished converting document 4_2024-02-21 in 0.05 sec.
2025-11-14 16:48:31,838 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:31,839 - ERROR - Input document 4_2024-02-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\HON\4_2024-02-20' --> 'data\processed_data\HON\4_2024-02-20.md'
Converted 'data\edgar_documents\HON\4_2024-02-21' --> 'data\processed_data\HON\4_2024-02-21.md'
Error processing data\edgar_documents\HON\4_2024-02-26: File format not allowed: data\edgar_documents\HON\4_2024-02-26
Error processing data\edgar_documents\HON\4_2024-02-28: File format not allowed: data\edgar_documents\HON\4_2024-02-28


2025-11-14 16:48:31,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:31,960 - INFO - Going to convert document batch...
2025-11-14 16:48:31,961 - INFO - Processing document 4_2024-04-03
2025-11-14 16:48:31,985 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 16:48:32,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,042 - INFO - Going to convert document batch...
2025-11-14 16:48:32,043 - INFO - Processing document 4_2024-04-17
2025-11-14 16:48:32,068 - INFO - Finished converting document 4_2024-04-17 in 0.05 sec.
2025-11-14 16:48:32,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,114 - INFO - Going to convert document batch...
2025-11-14 16:48:32,115 - INFO - Processing document 4_2024-05-01


Converted 'data\edgar_documents\HON\4_2024-02-29' --> 'data\processed_data\HON\4_2024-02-29.md'
Converted 'data\edgar_documents\HON\4_2024-04-03' --> 'data\processed_data\HON\4_2024-04-03.md'
Converted 'data\edgar_documents\HON\4_2024-04-17' --> 'data\processed_data\HON\4_2024-04-17.md'


2025-11-14 16:48:32,142 - INFO - Finished converting document 4_2024-05-01 in 0.05 sec.
2025-11-14 16:48:32,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,207 - INFO - Going to convert document batch...
2025-11-14 16:48:32,208 - INFO - Processing document 4_2024-05-02
2025-11-14 16:48:32,235 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 16:48:32,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,296 - INFO - Going to convert document batch...
2025-11-14 16:48:32,296 - INFO - Processing document 4_2024-05-15
2025-11-14 16:48:32,336 - INFO - Finished converting document 4_2024-05-15 in 0.06 sec.
2025-11-14 16:48:32,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2024-05-01' --> 'data\processed_data\HON\4_2024-05-01.md'
Converted 'data\edgar_documents\HON\4_2024-05-02' --> 'data\processed_data\HON\4_2024-05-02.md'
Converted 'data\edgar_documents\HON\4_2024-05-15' --> 'data\processed_data\HON\4_2024-05-15.md'


2025-11-14 16:48:32,382 - INFO - Going to convert document batch...
2025-11-14 16:48:32,382 - INFO - Processing document 4_2024-05-16
2025-11-14 16:48:32,408 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 16:48:32,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,458 - INFO - Going to convert document batch...
2025-11-14 16:48:32,459 - INFO - Processing document 4_2024-05-17
2025-11-14 16:48:32,487 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 16:48:32,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,536 - INFO - Going to convert document batch...
2025-11-14 16:48:32,538 - INFO - Processing document 4_2024-06-11
2025-11-14 16:48:32,561 - INFO - Finished converting document 4_2024-06-11 in 0.05 sec.
2025-11-14 16:48:32,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,607 - INFO - Going to convert document batch...
2025-11-14 16:48:32,608 - 

Converted 'data\edgar_documents\HON\4_2024-05-16' --> 'data\processed_data\HON\4_2024-05-16.md'
Converted 'data\edgar_documents\HON\4_2024-05-17' --> 'data\processed_data\HON\4_2024-05-17.md'
Converted 'data\edgar_documents\HON\4_2024-06-11' --> 'data\processed_data\HON\4_2024-06-11.md'


2025-11-14 16:48:32,668 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:32,668 - ERROR - Input document 4_2024-07-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:48:32,670 - INFO - Going to convert document batch...
2025-11-14 16:48:32,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,702 - INFO - Going to convert document batch...
2025-11-14 16:48:32,702 - INFO - Processing document 4_2024-07-30
2025-11-14 16:48:32,737 - INFO - Fin

Converted 'data\edgar_documents\HON\4_2024-07-02' --> 'data\processed_data\HON\4_2024-07-02.md'
Error processing data\edgar_documents\HON\4_2024-07-29: File format not allowed: data\edgar_documents\HON\4_2024-07-29
Converted 'data\edgar_documents\HON\4_2024-07-30' --> 'data\processed_data\HON\4_2024-07-30.md'
Error processing data\edgar_documents\HON\4_2024-07-31: File format not allowed: data\edgar_documents\HON\4_2024-07-31


2025-11-14 16:48:32,831 - INFO - Finished converting document 4_2024-08-01 in 0.05 sec.
2025-11-14 16:48:32,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,882 - INFO - Going to convert document batch...
2025-11-14 16:48:32,884 - INFO - Processing document 4_2024-08-16
2025-11-14 16:48:32,917 - INFO - Finished converting document 4_2024-08-16 in 0.06 sec.
2025-11-14 16:48:32,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:32,962 - INFO - Going to convert document batch...
2025-11-14 16:48:32,962 - INFO - Processing document 4_2024-10-03
2025-11-14 16:48:32,984 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 16:48:33,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:33,048 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\4_2024-08-01' --> 'data\processed_data\HON\4_2024-08-01.md'
Converted 'data\edgar_documents\HON\4_2024-08-16' --> 'data\processed_data\HON\4_2024-08-16.md'
Converted 'data\edgar_documents\HON\4_2024-10-03' --> 'data\processed_data\HON\4_2024-10-03.md'


2025-11-14 16:48:33,048 - INFO - Processing document 4_2024-10-07
2025-11-14 16:48:33,080 - INFO - Finished converting document 4_2024-10-07 in 0.08 sec.
2025-11-14 16:48:33,145 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:48:33,147 - ERROR - Input document 4_2024-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:48:33,148 - INFO - Going to convert document batch...
2025-11-14 16:48:33,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48

Converted 'data\edgar_documents\HON\4_2024-10-07' --> 'data\processed_data\HON\4_2024-10-07.md'
Error processing data\edgar_documents\HON\4_2024-10-24: File format not allowed: data\edgar_documents\HON\4_2024-10-24
Converted 'data\edgar_documents\HON\4_2024-10-29' --> 'data\processed_data\HON\4_2024-10-29.md'


2025-11-14 16:48:33,560 - INFO - Going to convert document batch...
2025-11-14 16:48:33,561 - INFO - Processing document 4_2024-10-30
2025-11-14 16:48:33,600 - INFO - Finished converting document 4_2024-10-30 in 0.38 sec.
2025-11-14 16:48:33,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:33,687 - INFO - Going to convert document batch...
2025-11-14 16:48:33,688 - INFO - Processing document 4_2024-11-07
2025-11-14 16:48:33,721 - INFO - Finished converting document 4_2024-11-07 in 0.08 sec.
2025-11-14 16:48:33,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:33,783 - INFO - Going to convert document batch...
2025-11-14 16:48:33,784 - INFO - Processing document 4_2024-11-13
2025-11-14 16:48:33,818 - INFO - Finished converting document 4_2024-11-13 in 0.06 sec.


Converted 'data\edgar_documents\HON\4_2024-10-30' --> 'data\processed_data\HON\4_2024-10-30.md'
Converted 'data\edgar_documents\HON\4_2024-11-07' --> 'data\processed_data\HON\4_2024-11-07.md'
Converted 'data\edgar_documents\HON\4_2024-11-13' --> 'data\processed_data\HON\4_2024-11-13.md'


2025-11-14 16:48:33,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:33,878 - INFO - Going to convert document batch...
2025-11-14 16:48:33,878 - INFO - Processing document 4_2024-11-18
2025-11-14 16:48:33,909 - INFO - Finished converting document 4_2024-11-18 in 0.06 sec.
2025-11-14 16:48:33,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:33,963 - INFO - Going to convert document batch...
2025-11-14 16:48:33,964 - INFO - Processing document 4_2024-12-18
2025-11-14 16:48:33,986 - INFO - Finished converting document 4_2024-12-18 in 0.05 sec.
2025-11-14 16:48:34,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,029 - INFO - Going to convert document batch...
2025-11-14 16:48:34,030 - INFO - Processing document 4_2025-01-06
2025-11-14 16:48:34,055 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 16:48:34,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\HON\4_2024-11-18' --> 'data\processed_data\HON\4_2024-11-18.md'
Converted 'data\edgar_documents\HON\4_2024-12-18' --> 'data\processed_data\HON\4_2024-12-18.md'
Converted 'data\edgar_documents\HON\4_2025-01-06' --> 'data\processed_data\HON\4_2025-01-06.md'


2025-11-14 16:48:34,129 - INFO - Finished converting document 4_2025-02-11 in 0.05 sec.
2025-11-14 16:48:34,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,195 - INFO - Going to convert document batch...
2025-11-14 16:48:34,196 - INFO - Processing document 4_2025-02-12
2025-11-14 16:48:34,221 - INFO - Finished converting document 4_2025-02-12 in 0.06 sec.
2025-11-14 16:48:34,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,276 - INFO - Going to convert document batch...
2025-11-14 16:48:34,277 - INFO - Processing document 4_2025-02-13
2025-11-14 16:48:34,311 - INFO - Finished converting document 4_2025-02-13 in 0.06 sec.


Converted 'data\edgar_documents\HON\4_2025-02-11' --> 'data\processed_data\HON\4_2025-02-11.md'
Converted 'data\edgar_documents\HON\4_2025-02-12' --> 'data\processed_data\HON\4_2025-02-12.md'


2025-11-14 16:48:34,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,363 - INFO - Going to convert document batch...
2025-11-14 16:48:34,364 - INFO - Processing document 4_2025-02-14
2025-11-14 16:48:34,403 - INFO - Finished converting document 4_2025-02-14 in 0.06 sec.
2025-11-14 16:48:34,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,451 - INFO - Going to convert document batch...
2025-11-14 16:48:34,452 - INFO - Processing document 4_2025-02-18
2025-11-14 16:48:34,472 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 16:48:34,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,518 - INFO - Going to convert document batch...
2025-11-14 16:48:34,519 - INFO - Processing document 4_2025-02-20


Converted 'data\edgar_documents\HON\4_2025-02-13' --> 'data\processed_data\HON\4_2025-02-13.md'
Converted 'data\edgar_documents\HON\4_2025-02-14' --> 'data\processed_data\HON\4_2025-02-14.md'
Converted 'data\edgar_documents\HON\4_2025-02-18' --> 'data\processed_data\HON\4_2025-02-18.md'


2025-11-14 16:48:34,544 - INFO - Finished converting document 4_2025-02-20 in 0.06 sec.
2025-11-14 16:48:34,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,612 - INFO - Going to convert document batch...
2025-11-14 16:48:34,613 - INFO - Processing document 4_2025-02-21
2025-11-14 16:48:34,643 - INFO - Finished converting document 4_2025-02-21 in 0.06 sec.
2025-11-14 16:48:34,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,693 - INFO - Going to convert document batch...
2025-11-14 16:48:34,694 - INFO - Processing document 4_2025-02-27
2025-11-14 16:48:34,722 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.
2025-11-14 16:48:34,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,767 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\4_2025-02-20' --> 'data\processed_data\HON\4_2025-02-20.md'
Converted 'data\edgar_documents\HON\4_2025-02-21' --> 'data\processed_data\HON\4_2025-02-21.md'
Converted 'data\edgar_documents\HON\4_2025-02-27' --> 'data\processed_data\HON\4_2025-02-27.md'


2025-11-14 16:48:34,768 - INFO - Processing document 4_2025-04-03
2025-11-14 16:48:34,792 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 16:48:34,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:34,952 - INFO - Going to convert document batch...
2025-11-14 16:48:34,953 - INFO - Processing document 4_2025-04-17
2025-11-14 16:48:34,977 - INFO - Finished converting document 4_2025-04-17 in 0.08 sec.
2025-11-14 16:48:35,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,028 - INFO - Going to convert document batch...
2025-11-14 16:48:35,029 - INFO - Processing document 4_2025-04-25
2025-11-14 16:48:35,055 - INFO - Finished converting document 4_2025-04-25 in 0.05 sec.
2025-11-14 16:48:35,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2025-04-03' --> 'data\processed_data\HON\4_2025-04-03.md'
Converted 'data\edgar_documents\HON\4_2025-04-17' --> 'data\processed_data\HON\4_2025-04-17.md'
Converted 'data\edgar_documents\HON\4_2025-04-25' --> 'data\processed_data\HON\4_2025-04-25.md'


2025-11-14 16:48:35,103 - INFO - Going to convert document batch...
2025-11-14 16:48:35,103 - INFO - Processing document 4_2025-05-05
2025-11-14 16:48:35,128 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 16:48:35,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,177 - INFO - Going to convert document batch...
2025-11-14 16:48:35,179 - INFO - Processing document 4_2025-05-21
2025-11-14 16:48:35,200 - INFO - Finished converting document 4_2025-05-21 in 0.05 sec.
2025-11-14 16:48:35,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,246 - INFO - Going to convert document batch...
2025-11-14 16:48:35,247 - INFO - Processing document 4_2025-06-03
2025-11-14 16:48:35,274 - INFO - Finished converting document 4_2025-06-03 in 0.05 sec.
2025-11-14 16:48:35,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,320 - INFO - Going to convert document batch...
2025-11-14 16:48:35,321 - 

Converted 'data\edgar_documents\HON\4_2025-05-05' --> 'data\processed_data\HON\4_2025-05-05.md'
Converted 'data\edgar_documents\HON\4_2025-05-21' --> 'data\processed_data\HON\4_2025-05-21.md'
Converted 'data\edgar_documents\HON\4_2025-06-03' --> 'data\processed_data\HON\4_2025-06-03.md'


2025-11-14 16:48:35,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,401 - INFO - Going to convert document batch...
2025-11-14 16:48:35,402 - INFO - Processing document 4_2025-07-02
2025-11-14 16:48:35,438 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 16:48:35,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,504 - INFO - Going to convert document batch...
2025-11-14 16:48:35,505 - INFO - Processing document 4_2025-07-16
2025-11-14 16:48:35,530 - INFO - Finished converting document 4_2025-07-16 in 0.06 sec.
2025-11-14 16:48:35,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2025-06-04' --> 'data\processed_data\HON\4_2025-06-04.md'
Converted 'data\edgar_documents\HON\4_2025-07-02' --> 'data\processed_data\HON\4_2025-07-02.md'
Converted 'data\edgar_documents\HON\4_2025-07-16' --> 'data\processed_data\HON\4_2025-07-16.md'


2025-11-14 16:48:35,579 - INFO - Going to convert document batch...
2025-11-14 16:48:35,579 - INFO - Processing document 4_2025-07-29
2025-11-14 16:48:35,623 - INFO - Finished converting document 4_2025-07-29 in 0.06 sec.
2025-11-14 16:48:35,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,678 - INFO - Going to convert document batch...
2025-11-14 16:48:35,678 - INFO - Processing document 4_2025-07-30
2025-11-14 16:48:35,704 - INFO - Finished converting document 4_2025-07-30 in 0.05 sec.
2025-11-14 16:48:35,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,749 - INFO - Going to convert document batch...
2025-11-14 16:48:35,750 - INFO - Processing document 4_2025-08-04
2025-11-14 16:48:35,777 - INFO - Finished converting document 4_2025-08-04 in 0.06 sec.
2025-11-14 16:48:35,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:35,840 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\4_2025-07-29' --> 'data\processed_data\HON\4_2025-07-29.md'
Converted 'data\edgar_documents\HON\4_2025-07-30' --> 'data\processed_data\HON\4_2025-07-30.md'
Converted 'data\edgar_documents\HON\4_2025-08-04' --> 'data\processed_data\HON\4_2025-08-04.md'


2025-11-14 16:48:35,840 - INFO - Processing document 4_2025-08-28
2025-11-14 16:48:35,883 - INFO - Finished converting document 4_2025-08-28 in 0.06 sec.
2025-11-14 16:48:36,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,056 - INFO - Going to convert document batch...
2025-11-14 16:48:36,057 - INFO - Processing document 4_2025-09-02
2025-11-14 16:48:36,075 - INFO - Finished converting document 4_2025-09-02 in 0.08 sec.
2025-11-14 16:48:36,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,126 - INFO - Going to convert document batch...
2025-11-14 16:48:36,128 - INFO - Processing document 4_2025-10-02
2025-11-14 16:48:36,152 - INFO - Finished converting document 4_2025-10-02 in 0.06 sec.
2025-11-14 16:48:36,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2025-08-28' --> 'data\processed_data\HON\4_2025-08-28.md'
Converted 'data\edgar_documents\HON\4_2025-09-02' --> 'data\processed_data\HON\4_2025-09-02.md'
Converted 'data\edgar_documents\HON\4_2025-10-02' --> 'data\processed_data\HON\4_2025-10-02.md'


2025-11-14 16:48:36,214 - INFO - Going to convert document batch...
2025-11-14 16:48:36,215 - INFO - Processing document 4_2025-10-06
2025-11-14 16:48:36,252 - INFO - Finished converting document 4_2025-10-06 in 0.06 sec.
2025-11-14 16:48:36,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,358 - INFO - Going to convert document batch...
2025-11-14 16:48:36,360 - INFO - Processing document 4_2025-10-15
2025-11-14 16:48:36,392 - INFO - Finished converting document 4_2025-10-15 in 0.11 sec.
2025-11-14 16:48:36,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,454 - INFO - Going to convert document batch...
2025-11-14 16:48:36,455 - INFO - Processing document 4_2025-10-29
2025-11-14 16:48:36,484 - INFO - Finished converting document 4_2025-10-29 in 0.08 sec.


Converted 'data\edgar_documents\HON\4_2025-10-06' --> 'data\processed_data\HON\4_2025-10-06.md'
Converted 'data\edgar_documents\HON\4_2025-10-15' --> 'data\processed_data\HON\4_2025-10-15.md'


2025-11-14 16:48:36,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,537 - INFO - Going to convert document batch...
2025-11-14 16:48:36,538 - INFO - Processing document 4_2025-10-30
2025-11-14 16:48:36,561 - INFO - Finished converting document 4_2025-10-30 in 0.05 sec.
2025-11-14 16:48:36,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,613 - INFO - Going to convert document batch...
2025-11-14 16:48:36,614 - INFO - Processing document 4_2025-11-05
2025-11-14 16:48:36,661 - INFO - Finished converting document 4_2025-11-05 in 0.08 sec.
2025-11-14 16:48:36,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\4_2025-10-29' --> 'data\processed_data\HON\4_2025-10-29.md'
Converted 'data\edgar_documents\HON\4_2025-10-30' --> 'data\processed_data\HON\4_2025-10-30.md'
Converted 'data\edgar_documents\HON\4_2025-11-05' --> 'data\processed_data\HON\4_2025-11-05.md'


2025-11-14 16:48:36,717 - INFO - Going to convert document batch...
2025-11-14 16:48:36,718 - INFO - Processing document 8-K_2023-02-02
2025-11-14 16:48:36,808 - INFO - Finished converting document 8-K_2023-02-02 in 0.12 sec.
2025-11-14 16:48:36,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,902 - INFO - Going to convert document batch...
2025-11-14 16:48:36,903 - INFO - Processing document 8-K_2023-03-14
2025-11-14 16:48:36,928 - INFO - Finished converting document 8-K_2023-03-14 in 0.09 sec.
2025-11-14 16:48:36,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:36,977 - INFO - Going to convert document batch...
2025-11-14 16:48:36,978 - INFO - Processing document 8-K_2023-03-21
2025-11-14 16:48:37,008 - INFO - Finished converting document 8-K_2023-03-21 in 0.06 sec.


Converted 'data\edgar_documents\HON\8-K_2023-02-02' --> 'data\processed_data\HON\8-K_2023-02-02.md'
Converted 'data\edgar_documents\HON\8-K_2023-03-14' --> 'data\processed_data\HON\8-K_2023-03-14.md'


2025-11-14 16:48:37,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,059 - INFO - Going to convert document batch...
2025-11-14 16:48:37,060 - INFO - Processing document 8-K_2023-04-24
2025-11-14 16:48:37,081 - INFO - Finished converting document 8-K_2023-04-24 in 0.06 sec.
2025-11-14 16:48:37,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,141 - INFO - Going to convert document batch...
2025-11-14 16:48:37,142 - INFO - Processing document 8-K_2023-04-27


Converted 'data\edgar_documents\HON\8-K_2023-03-21' --> 'data\processed_data\HON\8-K_2023-03-21.md'
Converted 'data\edgar_documents\HON\8-K_2023-04-24' --> 'data\processed_data\HON\8-K_2023-04-24.md'


2025-11-14 16:48:37,247 - INFO - Finished converting document 8-K_2023-04-27 in 0.16 sec.
2025-11-14 16:48:37,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,331 - INFO - Going to convert document batch...
2025-11-14 16:48:37,332 - INFO - Processing document 8-K_2023-05-17
2025-11-14 16:48:37,363 - INFO - Finished converting document 8-K_2023-05-17 in 0.09 sec.
2025-11-14 16:48:37,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,457 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\8-K_2023-04-27' --> 'data\processed_data\HON\8-K_2023-04-27.md'
Converted 'data\edgar_documents\HON\8-K_2023-05-17' --> 'data\processed_data\HON\8-K_2023-05-17.md'


2025-11-14 16:48:37,458 - INFO - Processing document 8-K_2023-05-23
2025-11-14 16:48:37,528 - INFO - Finished converting document 8-K_2023-05-23 in 0.16 sec.
2025-11-14 16:48:37,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,706 - INFO - Going to convert document batch...
2025-11-14 16:48:37,707 - INFO - Processing document 8-K_2023-06-06
2025-11-14 16:48:37,726 - INFO - Finished converting document 8-K_2023-06-06 in 0.06 sec.
2025-11-14 16:48:37,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,770 - INFO - Going to convert document batch...
2025-11-14 16:48:37,772 - INFO - Processing document 8-K_2023-06-15
2025-11-14 16:48:37,789 - INFO - Finished converting document 8-K_2023-06-15 in 0.05 sec.
2025-11-14 16:48:37,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,831 - INFO - Going to convert document batch...
2025-11-14 16:48:37,832 - INFO - Processing document 8-K_2023-07-27


Converted 'data\edgar_documents\HON\8-K_2023-05-23' --> 'data\processed_data\HON\8-K_2023-05-23.md'
Converted 'data\edgar_documents\HON\8-K_2023-06-06' --> 'data\processed_data\HON\8-K_2023-06-06.md'
Converted 'data\edgar_documents\HON\8-K_2023-06-15' --> 'data\processed_data\HON\8-K_2023-06-15.md'


2025-11-14 16:48:37,857 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.
2025-11-14 16:48:37,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:37,923 - INFO - Going to convert document batch...
2025-11-14 16:48:37,924 - INFO - Processing document 8-K_2023-10-10
2025-11-14 16:48:37,957 - INFO - Finished converting document 8-K_2023-10-10 in 0.08 sec.
2025-11-14 16:48:37,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,003 - INFO - Going to convert document batch...
2025-11-14 16:48:38,004 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:48:38,029 - INFO - Finished converting document 8-K_2023-10-26 in 0.06 sec.
2025-11-14 16:48:38,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2023-07-27' --> 'data\processed_data\HON\8-K_2023-07-27.md'
Converted 'data\edgar_documents\HON\8-K_2023-10-10' --> 'data\processed_data\HON\8-K_2023-10-10.md'
Converted 'data\edgar_documents\HON\8-K_2023-10-26' --> 'data\processed_data\HON\8-K_2023-10-26.md'


2025-11-14 16:48:38,074 - INFO - Going to convert document batch...
2025-11-14 16:48:38,075 - INFO - Processing document 8-K_2023-11-28
2025-11-14 16:48:38,112 - INFO - Finished converting document 8-K_2023-11-28 in 0.06 sec.
2025-11-14 16:48:38,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,170 - INFO - Going to convert document batch...
2025-11-14 16:48:38,172 - INFO - Processing document 8-K_2023-12-11
2025-11-14 16:48:38,194 - INFO - Finished converting document 8-K_2023-12-11 in 0.06 sec.
2025-11-14 16:48:38,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2023-11-28' --> 'data\processed_data\HON\8-K_2023-11-28.md'
Converted 'data\edgar_documents\HON\8-K_2023-12-11' --> 'data\processed_data\HON\8-K_2023-12-11.md'


2025-11-14 16:48:38,437 - INFO - Going to convert document batch...
2025-11-14 16:48:38,438 - INFO - Processing document 8-K_2024-02-01
2025-11-14 16:48:38,460 - INFO - Finished converting document 8-K_2024-02-01 in 0.25 sec.
2025-11-14 16:48:38,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,538 - INFO - Going to convert document batch...
2025-11-14 16:48:38,540 - INFO - Processing document 8-K_2024-03-01
2025-11-14 16:48:38,570 - INFO - Finished converting document 8-K_2024-03-01 in 0.09 sec.
2025-11-14 16:48:38,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,615 - INFO - Going to convert document batch...
2025-11-14 16:48:38,616 - INFO - Processing document 8-K_2024-03-19
2025-11-14 16:48:38,640 - INFO - Finished converting document 8-K_2024-03-19 in 0.06 sec.
2025-11-14 16:48:38,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2024-02-01' --> 'data\processed_data\HON\8-K_2024-02-01.md'
Converted 'data\edgar_documents\HON\8-K_2024-03-01' --> 'data\processed_data\HON\8-K_2024-03-01.md'
Converted 'data\edgar_documents\HON\8-K_2024-03-19' --> 'data\processed_data\HON\8-K_2024-03-19.md'


2025-11-14 16:48:38,699 - INFO - Going to convert document batch...
2025-11-14 16:48:38,700 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:48:38,738 - INFO - Finished converting document 8-K_2024-04-25 in 0.08 sec.
2025-11-14 16:48:38,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,813 - INFO - Going to convert document batch...
2025-11-14 16:48:38,815 - INFO - Processing document 8-K_2024-05-16
2025-11-14 16:48:38,860 - INFO - Finished converting document 8-K_2024-05-16 in 0.11 sec.


Converted 'data\edgar_documents\HON\8-K_2024-04-25' --> 'data\processed_data\HON\8-K_2024-04-25.md'
Converted 'data\edgar_documents\HON\8-K_2024-05-16' --> 'data\processed_data\HON\8-K_2024-05-16.md'


2025-11-14 16:48:38,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:38,948 - INFO - Going to convert document batch...
2025-11-14 16:48:38,949 - INFO - Processing document 8-K_2024-06-03
2025-11-14 16:48:38,984 - INFO - Finished converting document 8-K_2024-06-03 in 0.09 sec.
2025-11-14 16:48:39,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,025 - INFO - Going to convert document batch...
2025-11-14 16:48:39,026 - INFO - Processing document 8-K_2024-06-11
2025-11-14 16:48:39,049 - INFO - Finished converting document 8-K_2024-06-11 in 0.05 sec.
2025-11-14 16:48:39,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,105 - INFO - Going to convert document batch...
2025-11-14 16:48:39,106 - INFO - Processing document 8-K_2024-07-02
2025-11-14 16:48:39,135 - INFO - Finished converting document 8-K_2024-07-02 in 0.06 sec.
2025-11-14 16:48:39,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\HON\8-K_2024-06-03' --> 'data\processed_data\HON\8-K_2024-06-03.md'
Converted 'data\edgar_documents\HON\8-K_2024-06-11' --> 'data\processed_data\HON\8-K_2024-06-11.md'
Converted 'data\edgar_documents\HON\8-K_2024-07-02' --> 'data\processed_data\HON\8-K_2024-07-02.md'


2025-11-14 16:48:39,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,248 - INFO - Going to convert document batch...
2025-11-14 16:48:39,250 - INFO - Processing document 8-K_2024-07-25
2025-11-14 16:48:39,278 - INFO - Finished converting document 8-K_2024-07-25 in 0.06 sec.
2025-11-14 16:48:39,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,323 - INFO - Going to convert document batch...
2025-11-14 16:48:39,324 - INFO - Processing document 8-K_2024-08-02
2025-11-14 16:48:39,357 - INFO - Finished converting document 8-K_2024-08-02 in 0.08 sec.
2025-11-14 16:48:39,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,401 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\8-K_2024-07-10' --> 'data\processed_data\HON\8-K_2024-07-10.md'
Converted 'data\edgar_documents\HON\8-K_2024-07-25' --> 'data\processed_data\HON\8-K_2024-07-25.md'
Converted 'data\edgar_documents\HON\8-K_2024-08-02' --> 'data\processed_data\HON\8-K_2024-08-02.md'


2025-11-14 16:48:39,402 - INFO - Processing document 8-K_2024-08-12
2025-11-14 16:48:39,430 - INFO - Finished converting document 8-K_2024-08-12 in 0.05 sec.
2025-11-14 16:48:39,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,478 - INFO - Going to convert document batch...
2025-11-14 16:48:39,478 - INFO - Processing document 8-K_2024-09-05
2025-11-14 16:48:39,502 - INFO - Finished converting document 8-K_2024-09-05 in 0.05 sec.
2025-11-14 16:48:39,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,542 - INFO - Going to convert document batch...
2025-11-14 16:48:39,543 - INFO - Processing document 8-K_2024-10-08
2025-11-14 16:48:39,565 - INFO - Finished converting document 8-K_2024-10-08 in 0.05 sec.
2025-11-14 16:48:39,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,628 - INFO - Going to convert document batch...
2025-11-14 16:48:39,628 - INFO - Processing document 8-K_2024-10-24
2025-11-14 16:

Converted 'data\edgar_documents\HON\8-K_2024-08-12' --> 'data\processed_data\HON\8-K_2024-08-12.md'
Converted 'data\edgar_documents\HON\8-K_2024-09-05' --> 'data\processed_data\HON\8-K_2024-09-05.md'
Converted 'data\edgar_documents\HON\8-K_2024-10-08' --> 'data\processed_data\HON\8-K_2024-10-08.md'


2025-11-14 16:48:39,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,702 - INFO - Going to convert document batch...
2025-11-14 16:48:39,704 - INFO - Processing document 8-K_2024-12-02
2025-11-14 16:48:39,753 - INFO - Finished converting document 8-K_2024-12-02 in 0.08 sec.
2025-11-14 16:48:39,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,796 - INFO - Going to convert document batch...
2025-11-14 16:48:39,798 - INFO - Processing document 8-K_2025-02-06
2025-11-14 16:48:39,822 - INFO - Finished converting document 8-K_2025-02-06 in 0.05 sec.
2025-11-14 16:48:39,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,864 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\8-K_2024-10-24' --> 'data\processed_data\HON\8-K_2024-10-24.md'
Converted 'data\edgar_documents\HON\8-K_2024-12-02' --> 'data\processed_data\HON\8-K_2024-12-02.md'
Converted 'data\edgar_documents\HON\8-K_2025-02-06' --> 'data\processed_data\HON\8-K_2025-02-06.md'


2025-11-14 16:48:39,865 - INFO - Processing document 8-K_2025-02-18
2025-11-14 16:48:39,909 - INFO - Finished converting document 8-K_2025-02-18 in 0.08 sec.
2025-11-14 16:48:39,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:39,968 - INFO - Going to convert document batch...
2025-11-14 16:48:39,968 - INFO - Processing document 8-K_2025-03-17
2025-11-14 16:48:39,994 - INFO - Finished converting document 8-K_2025-03-17 in 0.06 sec.
2025-11-14 16:48:40,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,038 - INFO - Going to convert document batch...
2025-11-14 16:48:40,038 - INFO - Processing document 8-K_2025-04-01
2025-11-14 16:48:40,062 - INFO - Finished converting document 8-K_2025-04-01 in 0.06 sec.
2025-11-14 16:48:40,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,104 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\8-K_2025-02-18' --> 'data\processed_data\HON\8-K_2025-02-18.md'
Converted 'data\edgar_documents\HON\8-K_2025-03-17' --> 'data\processed_data\HON\8-K_2025-03-17.md'
Converted 'data\edgar_documents\HON\8-K_2025-04-01' --> 'data\processed_data\HON\8-K_2025-04-01.md'


2025-11-14 16:48:40,105 - INFO - Processing document 8-K_2025-04-08
2025-11-14 16:48:40,128 - INFO - Finished converting document 8-K_2025-04-08 in 0.05 sec.
2025-11-14 16:48:40,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,266 - INFO - Going to convert document batch...
2025-11-14 16:48:40,267 - INFO - Processing document 8-K_2025-04-29
2025-11-14 16:48:40,297 - INFO - Finished converting document 8-K_2025-04-29 in 0.16 sec.


Converted 'data\edgar_documents\HON\8-K_2025-04-08' --> 'data\processed_data\HON\8-K_2025-04-08.md'
Converted 'data\edgar_documents\HON\8-K_2025-04-29' --> 'data\processed_data\HON\8-K_2025-04-29.md'


2025-11-14 16:48:40,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,385 - INFO - Going to convert document batch...
2025-11-14 16:48:40,386 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:48:40,417 - INFO - Finished converting document 8-K_2025-05-08 in 0.11 sec.
2025-11-14 16:48:40,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,478 - INFO - Going to convert document batch...
2025-11-14 16:48:40,479 - INFO - Processing document 8-K_2025-05-23
2025-11-14 16:48:40,527 - INFO - Finished converting document 8-K_2025-05-23 in 0.09 sec.
2025-11-14 16:48:40,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2025-05-08' --> 'data\processed_data\HON\8-K_2025-05-08.md'
Converted 'data\edgar_documents\HON\8-K_2025-05-23' --> 'data\processed_data\HON\8-K_2025-05-23.md'


2025-11-14 16:48:40,644 - INFO - Going to convert document batch...
2025-11-14 16:48:40,645 - INFO - Processing document 8-K_2025-05-28
2025-11-14 16:48:40,746 - INFO - Finished converting document 8-K_2025-05-28 in 0.19 sec.
2025-11-14 16:48:40,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,842 - INFO - Going to convert document batch...
2025-11-14 16:48:40,843 - INFO - Processing document 8-K_2025-06-24
2025-11-14 16:48:40,875 - INFO - Finished converting document 8-K_2025-06-24 in 0.09 sec.
2025-11-14 16:48:40,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:40,935 - INFO - Going to convert document batch...
2025-11-14 16:48:40,935 - INFO - Processing document 8-K_2025-07-24
2025-11-14 16:48:40,967 - INFO - Finished converting document 8-K_2025-07-24 in 0.08 sec.


Converted 'data\edgar_documents\HON\8-K_2025-05-28' --> 'data\processed_data\HON\8-K_2025-05-28.md'
Converted 'data\edgar_documents\HON\8-K_2025-06-24' --> 'data\processed_data\HON\8-K_2025-06-24.md'


2025-11-14 16:48:41,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,037 - INFO - Going to convert document batch...
2025-11-14 16:48:41,038 - INFO - Processing document 8-K_2025-07-30
2025-11-14 16:48:41,078 - INFO - Finished converting document 8-K_2025-07-30 in 0.09 sec.
2025-11-14 16:48:41,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,129 - INFO - Going to convert document batch...
2025-11-14 16:48:41,130 - INFO - Processing document 8-K_2025-08-21
2025-11-14 16:48:41,154 - INFO - Finished converting document 8-K_2025-08-21 in 0.06 sec.
2025-11-14 16:48:41,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2025-07-24' --> 'data\processed_data\HON\8-K_2025-07-24.md'
Converted 'data\edgar_documents\HON\8-K_2025-07-30' --> 'data\processed_data\HON\8-K_2025-07-30.md'
Converted 'data\edgar_documents\HON\8-K_2025-08-21' --> 'data\processed_data\HON\8-K_2025-08-21.md'


2025-11-14 16:48:41,195 - INFO - Going to convert document batch...
2025-11-14 16:48:41,196 - INFO - Processing document 8-K_2025-08-22
2025-11-14 16:48:41,301 - INFO - Finished converting document 8-K_2025-08-22 in 0.12 sec.
2025-11-14 16:48:41,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,385 - INFO - Going to convert document batch...
2025-11-14 16:48:41,385 - INFO - Processing document 8-K_2025-10-01
2025-11-14 16:48:41,410 - INFO - Finished converting document 8-K_2025-10-01 in 0.06 sec.
2025-11-14 16:48:41,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,457 - INFO - Going to convert document batch...
2025-11-14 16:48:41,458 - INFO - Processing document 8-K_2025-10-16
2025-11-14 16:48:41,484 - INFO - Finished converting document 8-K_2025-10-16 in 0.06 sec.
2025-11-14 16:48:41,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,526 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\HON\8-K_2025-08-22' --> 'data\processed_data\HON\8-K_2025-08-22.md'
Converted 'data\edgar_documents\HON\8-K_2025-10-01' --> 'data\processed_data\HON\8-K_2025-10-01.md'
Converted 'data\edgar_documents\HON\8-K_2025-10-16' --> 'data\processed_data\HON\8-K_2025-10-16.md'


2025-11-14 16:48:41,527 - INFO - Processing document 8-K_2025-10-22
2025-11-14 16:48:41,549 - INFO - Finished converting document 8-K_2025-10-22 in 0.05 sec.
2025-11-14 16:48:41,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,603 - INFO - Going to convert document batch...
2025-11-14 16:48:41,604 - INFO - Processing document 8-K_2025-10-23
2025-11-14 16:48:41,627 - INFO - Finished converting document 8-K_2025-10-23 in 0.06 sec.
2025-11-14 16:48:41,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,670 - INFO - Going to convert document batch...
2025-11-14 16:48:41,671 - INFO - Processing document 8-K_2025-10-30
2025-11-14 16:48:41,694 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 16:48:41,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:48:41,734 - INFO - Going to convert document batch...
2025-11-14 16:48:41,734 - INFO - Processing document 8-K_2025-11-03
2025-11-14 16:

Converted 'data\edgar_documents\HON\8-K_2025-10-22' --> 'data\processed_data\HON\8-K_2025-10-22.md'
Converted 'data\edgar_documents\HON\8-K_2025-10-23' --> 'data\processed_data\HON\8-K_2025-10-23.md'
Converted 'data\edgar_documents\HON\8-K_2025-10-30' --> 'data\processed_data\HON\8-K_2025-10-30.md'


2025-11-14 16:48:41,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\8-K_2025-11-03' --> 'data\processed_data\HON\8-K_2025-11-03.md'


2025-11-14 16:48:42,931 - INFO - Going to convert document batch...
2025-11-14 16:48:42,932 - INFO - Processing document DEF-14A_2023-04-06
2025-11-14 16:48:49,088 - INFO - Finished converting document DEF-14A_2023-04-06 in 7.31 sec.
2025-11-14 16:48:50,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\DEF-14A_2023-04-06' --> 'data\processed_data\HON\DEF-14A_2023-04-06.md'


2025-11-14 16:48:51,542 - INFO - Going to convert document batch...
2025-11-14 16:48:51,543 - INFO - Processing document DEF-14A_2024-04-02
2025-11-14 16:48:58,304 - INFO - Finished converting document DEF-14A_2024-04-02 in 7.64 sec.
2025-11-14 16:49:00,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\DEF-14A_2024-04-02' --> 'data\processed_data\HON\DEF-14A_2024-04-02.md'


2025-11-14 16:49:01,717 - INFO - Going to convert document batch...
2025-11-14 16:49:01,718 - INFO - Processing document DEF-14A_2025-04-09
2025-11-14 16:49:08,162 - INFO - Finished converting document DEF-14A_2025-04-09 in 8.08 sec.
2025-11-14 16:49:10,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\HON\DEF-14A_2025-04-09' --> 'data\processed_data\HON\DEF-14A_2025-04-09.md'
Processed 150 new files. Errors: 8
Found 116 files to process in data\edgar_documents\IBM


2025-11-14 16:49:10,596 - INFO - Going to convert document batch...
2025-11-14 16:49:10,597 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:49:10,598 - INFO - Processing document 10-K_2023-02-28
2025-11-14 16:49:11,296 - INFO - Finished converting document 10-K_2023-02-28 in 1.23 sec.
2025-11-14 16:49:11,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-K_2023-02-28' --> 'data\processed_data\IBM\10-K_2023-02-28.md'


2025-11-14 16:49:12,441 - INFO - Going to convert document batch...
2025-11-14 16:49:12,442 - INFO - Processing document 10-K_2024-02-26
2025-11-14 16:49:12,980 - INFO - Finished converting document 10-K_2024-02-26 in 1.47 sec.
2025-11-14 16:49:13,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-K_2024-02-26' --> 'data\processed_data\IBM\10-K_2024-02-26.md'


2025-11-14 16:49:13,693 - INFO - Going to convert document batch...
2025-11-14 16:49:13,695 - INFO - Processing document 10-K_2025-02-25
2025-11-14 16:49:14,196 - INFO - Finished converting document 10-K_2025-02-25 in 1.05 sec.
2025-11-14 16:49:14,512 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:49:14,513 - ERROR - Input document 10-Q_2023-04-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:49:14,517 - INFO - Going to convert d

Converted 'data\edgar_documents\IBM\10-K_2025-02-25' --> 'data\processed_data\IBM\10-K_2025-02-25.md'
Error processing data\edgar_documents\IBM\10-Q_2023-04-25: File format not allowed: data\edgar_documents\IBM\10-Q_2023-04-25


2025-11-14 16:49:16,184 - INFO - Going to convert document batch...
2025-11-14 16:49:16,185 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 16:49:18,989 - INFO - Finished converting document 10-Q_2023-07-25 in 4.47 sec.
2025-11-14 16:49:20,278 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\IBM\10-Q_2023-07-25' --> 'data\processed_data\IBM\10-Q_2023-07-25.md'


2025-11-14 16:49:20,279 - ERROR - Input document 10-Q_2023-10-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:49:20,283 - INFO - Going to convert document batch...
2025-11-14 16:49:20,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\IBM\10-Q_2023-10-31: File format not allowed: data\edgar_documents\IBM\10-Q_2023-10-31


2025-11-14 16:49:21,077 - INFO - Going to convert document batch...
2025-11-14 16:49:21,078 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 16:49:23,445 - INFO - Finished converting document 10-Q_2024-04-30 in 3.16 sec.
2025-11-14 16:49:24,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-Q_2024-04-30' --> 'data\processed_data\IBM\10-Q_2024-04-30.md'


2025-11-14 16:49:25,445 - INFO - Going to convert document batch...
2025-11-14 16:49:25,445 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 16:49:28,774 - INFO - Finished converting document 10-Q_2024-07-30 in 4.66 sec.
2025-11-14 16:49:29,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-Q_2024-07-30' --> 'data\processed_data\IBM\10-Q_2024-07-30.md'


2025-11-14 16:49:31,114 - INFO - Going to convert document batch...
2025-11-14 16:49:31,115 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 16:49:34,456 - INFO - Finished converting document 10-Q_2024-10-30 in 4.69 sec.
2025-11-14 16:49:35,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-Q_2024-10-30' --> 'data\processed_data\IBM\10-Q_2024-10-30.md'


2025-11-14 16:49:36,540 - INFO - Going to convert document batch...
2025-11-14 16:49:36,542 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 16:49:38,354 - INFO - Finished converting document 10-Q_2025-04-24 in 2.73 sec.
2025-11-14 16:49:39,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-Q_2025-04-24' --> 'data\processed_data\IBM\10-Q_2025-04-24.md'


2025-11-14 16:49:41,193 - INFO - Going to convert document batch...
2025-11-14 16:49:41,194 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:49:43,903 - INFO - Finished converting document 10-Q_2025-07-24 in 4.86 sec.
2025-11-14 16:49:45,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\10-Q_2025-07-24' --> 'data\processed_data\IBM\10-Q_2025-07-24.md'


2025-11-14 16:49:46,815 - INFO - Going to convert document batch...
2025-11-14 16:49:46,816 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 16:49:50,036 - INFO - Finished converting document 10-Q_2025-10-23 in 5.16 sec.
2025-11-14 16:49:51,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,095 - INFO - Going to convert document batch...
2025-11-14 16:49:51,096 - INFO - Processing document 4_2023-01-03
2025-11-14 16:49:51,127 - INFO - Finished converting document 4_2023-01-03 in 0.09 sec.
2025-11-14 16:49:51,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,210 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\IBM\10-Q_2025-10-23' --> 'data\processed_data\IBM\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\IBM\4_2023-01-03' --> 'data\processed_data\IBM\4_2023-01-03.md'


2025-11-14 16:49:51,218 - INFO - Processing document 4_2023-01-05
2025-11-14 16:49:51,359 - INFO - Finished converting document 4_2023-01-05 in 0.20 sec.
2025-11-14 16:49:51,410 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:49:51,411 - ERROR - Input document 4_2023-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:49:51,413 - INFO - Going to convert document batch...
2025-11-14 16:49:51,441 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\IBM\4_2023-01-05' --> 'data\processed_data\IBM\4_2023-01-05.md'
Error processing data\edgar_documents\IBM\4_2023-01-30: File format not allowed: data\edgar_documents\IBM\4_2023-01-30
Error processing data\edgar_documents\IBM\4_2023-02-01: File format not allowed: data\edgar_documents\IBM\4_2023-02-01


2025-11-14 16:49:51,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,650 - INFO - Going to convert document batch...
2025-11-14 16:49:51,652 - INFO - Processing document 4_2023-02-13
2025-11-14 16:49:51,688 - INFO - Finished converting document 4_2023-02-13 in 0.09 sec.
2025-11-14 16:49:51,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,768 - INFO - Going to convert document batch...
2025-11-14 16:49:51,770 - INFO - Processing document 4_2023-02-23


Converted 'data\edgar_documents\IBM\4_2023-02-03' --> 'data\processed_data\IBM\4_2023-02-03.md'
Converted 'data\edgar_documents\IBM\4_2023-02-13' --> 'data\processed_data\IBM\4_2023-02-13.md'


2025-11-14 16:49:51,809 - INFO - Finished converting document 4_2023-02-23 in 0.08 sec.
2025-11-14 16:49:51,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,875 - INFO - Going to convert document batch...
2025-11-14 16:49:51,876 - INFO - Processing document 4_2023-04-03
2025-11-14 16:49:51,901 - INFO - Finished converting document 4_2023-04-03 in 0.06 sec.
2025-11-14 16:49:51,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:51,961 - INFO - Going to convert document batch...
2025-11-14 16:49:51,962 - INFO - Processing document 4_2023-05-11
2025-11-14 16:49:51,986 - INFO - Finished converting document 4_2023-05-11 in 0.05 sec.
2025-11-14 16:49:52,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\4_2023-02-23' --> 'data\processed_data\IBM\4_2023-02-23.md'
Converted 'data\edgar_documents\IBM\4_2023-04-03' --> 'data\processed_data\IBM\4_2023-04-03.md'
Converted 'data\edgar_documents\IBM\4_2023-05-11' --> 'data\processed_data\IBM\4_2023-05-11.md'


2025-11-14 16:49:52,056 - INFO - Going to convert document batch...
2025-11-14 16:49:52,057 - INFO - Processing document 4_2023-06-06
2025-11-14 16:49:52,100 - INFO - Finished converting document 4_2023-06-06 in 0.08 sec.
2025-11-14 16:49:52,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:52,278 - INFO - Going to convert document batch...
2025-11-14 16:49:52,280 - INFO - Processing document 4_2023-06-09
2025-11-14 16:49:52,320 - INFO - Finished converting document 4_2023-06-09 in 0.11 sec.
2025-11-14 16:49:52,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\4_2023-06-06' --> 'data\processed_data\IBM\4_2023-06-06.md'
Converted 'data\edgar_documents\IBM\4_2023-06-09' --> 'data\processed_data\IBM\4_2023-06-09.md'


2025-11-14 16:49:52,417 - INFO - Going to convert document batch...
2025-11-14 16:49:52,419 - INFO - Processing document 4_2023-07-05
2025-11-14 16:49:52,447 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 16:49:52,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:52,542 - INFO - Going to convert document batch...
2025-11-14 16:49:52,543 - INFO - Processing document 4_2023-08-10
2025-11-14 16:49:52,565 - INFO - Finished converting document 4_2023-08-10 in 0.08 sec.
2025-11-14 16:49:52,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:52,614 - INFO - Going to convert document batch...
2025-11-14 16:49:52,615 - INFO - Processing document 4_2023-08-22
2025-11-14 16:49:52,645 - INFO - Finished converting document 4_2023-08-22 in 0.05 sec.


Converted 'data\edgar_documents\IBM\4_2023-07-05' --> 'data\processed_data\IBM\4_2023-07-05.md'
Converted 'data\edgar_documents\IBM\4_2023-08-10' --> 'data\processed_data\IBM\4_2023-08-10.md'


2025-11-14 16:49:52,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:52,697 - INFO - Going to convert document batch...
2025-11-14 16:49:52,698 - INFO - Processing document 4_2023-10-03
2025-11-14 16:49:52,734 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.


Converted 'data\edgar_documents\IBM\4_2023-08-22' --> 'data\processed_data\IBM\4_2023-08-22.md'
Converted 'data\edgar_documents\IBM\4_2023-10-03' --> 'data\processed_data\IBM\4_2023-10-03.md'


2025-11-14 16:49:52,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:52,901 - INFO - Going to convert document batch...
2025-11-14 16:49:52,903 - INFO - Processing document 4_2023-11-13
2025-11-14 16:49:52,929 - INFO - Finished converting document 4_2023-11-13 in 0.16 sec.
2025-11-14 16:49:52,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,013 - INFO - Going to convert document batch...
2025-11-14 16:49:53,014 - INFO - Processing document 4_2023-12-13
2025-11-14 16:49:53,044 - INFO - Finished converting document 4_2023-12-13 in 0.09 sec.
2025-11-14 16:49:53,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,101 - INFO - Going to convert document batch...
2025-11-14 16:49:53,102 - INFO - Processing document 4_2023-12-29
2025-11-14 16:49:53,128 - INFO - Finished converting document 4_2023-12-29 in 0.06 sec.


Converted 'data\edgar_documents\IBM\4_2023-11-13' --> 'data\processed_data\IBM\4_2023-11-13.md'
Converted 'data\edgar_documents\IBM\4_2023-12-13' --> 'data\processed_data\IBM\4_2023-12-13.md'


2025-11-14 16:49:53,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,181 - INFO - Going to convert document batch...
2025-11-14 16:49:53,182 - INFO - Processing document 4_2024-01-03
2025-11-14 16:49:53,224 - INFO - Finished converting document 4_2024-01-03 in 0.06 sec.
2025-11-14 16:49:53,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,312 - INFO - Going to convert document batch...
2025-11-14 16:49:53,313 - INFO - Processing document 4_2024-01-05


Converted 'data\edgar_documents\IBM\4_2023-12-29' --> 'data\processed_data\IBM\4_2023-12-29.md'
Converted 'data\edgar_documents\IBM\4_2024-01-03' --> 'data\processed_data\IBM\4_2024-01-03.md'


2025-11-14 16:49:53,350 - INFO - Finished converting document 4_2024-01-05 in 0.08 sec.
2025-11-14 16:49:53,426 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:49:53,427 - ERROR - Input document 4_2024-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:49:53,429 - INFO - Going to convert document batch...
2025-11-14 16:49:53,456 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:49:53,458 - ERROR - Input document 4_2024-01-31 with forma

Converted 'data\edgar_documents\IBM\4_2024-01-05' --> 'data\processed_data\IBM\4_2024-01-05.md'
Error processing data\edgar_documents\IBM\4_2024-01-29: File format not allowed: data\edgar_documents\IBM\4_2024-01-29
Error processing data\edgar_documents\IBM\4_2024-01-31: File format not allowed: data\edgar_documents\IBM\4_2024-01-31


2025-11-14 16:49:53,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,630 - INFO - Going to convert document batch...
2025-11-14 16:49:53,631 - INFO - Processing document 4_2024-02-12
2025-11-14 16:49:53,657 - INFO - Finished converting document 4_2024-02-12 in 0.06 sec.
2025-11-14 16:49:53,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,714 - INFO - Going to convert document batch...
2025-11-14 16:49:53,714 - INFO - Processing document 4_2024-02-13
2025-11-14 16:49:53,747 - INFO - Finished converting document 4_2024-02-13 in 0.06 sec.


Converted 'data\edgar_documents\IBM\4_2024-02-05' --> 'data\processed_data\IBM\4_2024-02-05.md'
Converted 'data\edgar_documents\IBM\4_2024-02-12' --> 'data\processed_data\IBM\4_2024-02-12.md'


2025-11-14 16:49:53,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:53,808 - INFO - Going to convert document batch...
2025-11-14 16:49:53,810 - INFO - Processing document 4_2024-02-23
2025-11-14 16:49:53,897 - INFO - Finished converting document 4_2024-02-23 in 0.11 sec.


Converted 'data\edgar_documents\IBM\4_2024-02-13' --> 'data\processed_data\IBM\4_2024-02-13.md'
Converted 'data\edgar_documents\IBM\4_2024-02-23' --> 'data\processed_data\IBM\4_2024-02-23.md'


2025-11-14 16:49:54,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,030 - INFO - Going to convert document batch...
2025-11-14 16:49:54,032 - INFO - Processing document 4_2024-04-01
2025-11-14 16:49:54,075 - INFO - Finished converting document 4_2024-04-01 in 0.11 sec.
2025-11-14 16:49:54,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,167 - INFO - Going to convert document batch...
2025-11-14 16:49:54,168 - INFO - Processing document 4_2024-04-04
2025-11-14 16:49:54,214 - INFO - Finished converting document 4_2024-04-04 in 0.11 sec.


Converted 'data\edgar_documents\IBM\4_2024-04-01' --> 'data\processed_data\IBM\4_2024-04-01.md'
Converted 'data\edgar_documents\IBM\4_2024-04-04' --> 'data\processed_data\IBM\4_2024-04-04.md'


2025-11-14 16:49:54,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,372 - INFO - Going to convert document batch...
2025-11-14 16:49:54,374 - INFO - Processing document 4_2024-05-10
2025-11-14 16:49:54,413 - INFO - Finished converting document 4_2024-05-10 in 0.16 sec.
2025-11-14 16:49:54,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,502 - INFO - Going to convert document batch...
2025-11-14 16:49:54,503 - INFO - Processing document 4_2024-06-11
2025-11-14 16:49:54,560 - INFO - Finished converting document 4_2024-06-11 in 0.11 sec.


Converted 'data\edgar_documents\IBM\4_2024-05-10' --> 'data\processed_data\IBM\4_2024-05-10.md'
Converted 'data\edgar_documents\IBM\4_2024-06-11' --> 'data\processed_data\IBM\4_2024-06-11.md'


2025-11-14 16:49:54,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,695 - INFO - Going to convert document batch...
2025-11-14 16:49:54,697 - INFO - Processing document 4_2024-07-02
2025-11-14 16:49:54,727 - INFO - Finished converting document 4_2024-07-02 in 0.08 sec.
2025-11-14 16:49:54,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,834 - INFO - Going to convert document batch...
2025-11-14 16:49:54,835 - INFO - Processing document 4_2024-07-03
2025-11-14 16:49:54,897 - INFO - Finished converting document 4_2024-07-03 in 0.12 sec.


Converted 'data\edgar_documents\IBM\4_2024-07-02' --> 'data\processed_data\IBM\4_2024-07-02.md'
Converted 'data\edgar_documents\IBM\4_2024-07-03' --> 'data\processed_data\IBM\4_2024-07-03.md'


2025-11-14 16:49:54,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:54,990 - INFO - Going to convert document batch...
2025-11-14 16:49:54,991 - INFO - Processing document 4_2024-08-12
2025-11-14 16:49:55,026 - INFO - Finished converting document 4_2024-08-12 in 0.09 sec.
2025-11-14 16:49:55,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,083 - INFO - Going to convert document batch...
2025-11-14 16:49:55,084 - INFO - Processing document 4_2024-09-03
2025-11-14 16:49:55,114 - INFO - Finished converting document 4_2024-09-03 in 0.05 sec.
2025-11-14 16:49:55,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,184 - INFO - Going to convert document batch...
2025-11-14 16:49:55,185 - INFO - Processing document 4_2024-10-01
2025-11-14 16:49:55,211 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 16:49:55,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\4_2024-08-12' --> 'data\processed_data\IBM\4_2024-08-12.md'
Converted 'data\edgar_documents\IBM\4_2024-09-03' --> 'data\processed_data\IBM\4_2024-09-03.md'
Converted 'data\edgar_documents\IBM\4_2024-10-01' --> 'data\processed_data\IBM\4_2024-10-01.md'


2025-11-14 16:49:55,258 - INFO - Going to convert document batch...
2025-11-14 16:49:55,260 - INFO - Processing document 4_2024-11-08
2025-11-14 16:49:55,282 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 16:49:55,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,357 - INFO - Going to convert document batch...
2025-11-14 16:49:55,358 - INFO - Processing document 4_2024-11-13
2025-11-14 16:49:55,380 - INFO - Finished converting document 4_2024-11-13 in 0.05 sec.
2025-11-14 16:49:55,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,436 - INFO - Going to convert document batch...
2025-11-14 16:49:55,438 - INFO - Processing document 4_2025-01-02
2025-11-14 16:49:55,466 - INFO - Finished converting document 4_2025-01-02 in 0.06 sec.
2025-11-14 16:49:55,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,513 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\IBM\4_2024-11-08' --> 'data\processed_data\IBM\4_2024-11-08.md'
Converted 'data\edgar_documents\IBM\4_2024-11-13' --> 'data\processed_data\IBM\4_2024-11-13.md'
Converted 'data\edgar_documents\IBM\4_2025-01-02' --> 'data\processed_data\IBM\4_2025-01-02.md'


2025-11-14 16:49:55,514 - INFO - Processing document 4_2025-01-06
2025-11-14 16:49:55,539 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 16:49:55,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:55,674 - INFO - Going to convert document batch...
2025-11-14 16:49:55,680 - INFO - Processing document 4_2025-02-03
2025-11-14 16:49:55,704 - INFO - Finished converting document 4_2025-02-03 in 0.12 sec.
2025-11-14 16:49:55,793 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\IBM\4_2025-01-06' --> 'data\processed_data\IBM\4_2025-01-06.md'
Converted 'data\edgar_documents\IBM\4_2025-02-03' --> 'data\processed_data\IBM\4_2025-02-03.md'


2025-11-14 16:49:55,794 - ERROR - Input document 4_2025-02-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:49:55,796 - INFO - Going to convert document batch...
2025-11-14 16:49:55,829 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:49:55,829 - ERROR - Input document 4_2025-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\IBM\4_2025-02-05: File format not allowed: data\edgar_documents\IBM\4_2025-02-05
Error processing data\edgar_documents\IBM\4_2025-02-06: File format not allowed: data\edgar_documents\IBM\4_2025-02-06
Converted 'data\edgar_documents\IBM\4_2025-02-11' --> 'data\processed_data\IBM\4_2025-02-11.md'


2025-11-14 16:49:56,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,052 - INFO - Going to convert document batch...
2025-11-14 16:49:56,053 - INFO - Processing document 4_2025-02-19
2025-11-14 16:49:56,083 - INFO - Finished converting document 4_2025-02-19 in 0.06 sec.
2025-11-14 16:49:56,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,150 - INFO - Going to convert document batch...
2025-11-14 16:49:56,151 - INFO - Processing document 4_2025-02-25
2025-11-14 16:49:56,193 - INFO - Finished converting document 4_2025-02-25 in 0.08 sec.


Converted 'data\edgar_documents\IBM\4_2025-02-12' --> 'data\processed_data\IBM\4_2025-02-12.md'
Converted 'data\edgar_documents\IBM\4_2025-02-19' --> 'data\processed_data\IBM\4_2025-02-19.md'


2025-11-14 16:49:56,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,247 - INFO - Going to convert document batch...
2025-11-14 16:49:56,248 - INFO - Processing document 4_2025-02-28
2025-11-14 16:49:56,277 - INFO - Finished converting document 4_2025-02-28 in 0.06 sec.
2025-11-14 16:49:56,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,376 - INFO - Going to convert document batch...
2025-11-14 16:49:56,377 - INFO - Processing document 4_2025-03-03
2025-11-14 16:49:56,405 - INFO - Finished converting document 4_2025-03-03 in 0.11 sec.


Converted 'data\edgar_documents\IBM\4_2025-02-25' --> 'data\processed_data\IBM\4_2025-02-25.md'
Converted 'data\edgar_documents\IBM\4_2025-02-28' --> 'data\processed_data\IBM\4_2025-02-28.md'


2025-11-14 16:49:56,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,459 - INFO - Going to convert document batch...
2025-11-14 16:49:56,460 - INFO - Processing document 4_2025-03-06
2025-11-14 16:49:56,482 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 16:49:56,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,533 - INFO - Going to convert document batch...
2025-11-14 16:49:56,534 - INFO - Processing document 4_2025-04-01
2025-11-14 16:49:56,564 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 16:49:56,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\4_2025-03-03' --> 'data\processed_data\IBM\4_2025-03-03.md'
Converted 'data\edgar_documents\IBM\4_2025-03-06' --> 'data\processed_data\IBM\4_2025-03-06.md'
Converted 'data\edgar_documents\IBM\4_2025-04-01' --> 'data\processed_data\IBM\4_2025-04-01.md'


2025-11-14 16:49:56,626 - INFO - Going to convert document batch...
2025-11-14 16:49:56,627 - INFO - Processing document 4_2025-06-09
2025-11-14 16:49:56,669 - INFO - Finished converting document 4_2025-06-09 in 0.08 sec.
2025-11-14 16:49:56,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,722 - INFO - Going to convert document batch...
2025-11-14 16:49:56,724 - INFO - Processing document 4_2025-07-01
2025-11-14 16:49:56,746 - INFO - Finished converting document 4_2025-07-01 in 0.05 sec.
2025-11-14 16:49:56,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:56,811 - INFO - Going to convert document batch...
2025-11-14 16:49:56,813 - INFO - Processing document 4_2025-07-02


Converted 'data\edgar_documents\IBM\4_2025-06-09' --> 'data\processed_data\IBM\4_2025-06-09.md'
Converted 'data\edgar_documents\IBM\4_2025-07-01' --> 'data\processed_data\IBM\4_2025-07-01.md'


2025-11-14 16:49:56,938 - INFO - Finished converting document 4_2025-07-02 in 0.17 sec.
2025-11-14 16:49:57,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,024 - INFO - Going to convert document batch...
2025-11-14 16:49:57,025 - INFO - Processing document 4_2025-09-02
2025-11-14 16:49:57,050 - INFO - Finished converting document 4_2025-09-02 in 0.08 sec.
2025-11-14 16:49:57,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,099 - INFO - Going to convert document batch...
2025-11-14 16:49:57,100 - INFO - Processing document 4_2025-10-01
2025-11-14 16:49:57,121 - INFO - Finished converting document 4_2025-10-01 in 0.05 sec.
2025-11-14 16:49:57,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\4_2025-07-02' --> 'data\processed_data\IBM\4_2025-07-02.md'
Converted 'data\edgar_documents\IBM\4_2025-09-02' --> 'data\processed_data\IBM\4_2025-09-02.md'
Converted 'data\edgar_documents\IBM\4_2025-10-01' --> 'data\processed_data\IBM\4_2025-10-01.md'


2025-11-14 16:49:57,178 - INFO - Going to convert document batch...
2025-11-14 16:49:57,179 - INFO - Processing document 4_2025-11-05
2025-11-14 16:49:57,200 - INFO - Finished converting document 4_2025-11-05 in 0.06 sec.
2025-11-14 16:49:57,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,264 - INFO - Going to convert document batch...
2025-11-14 16:49:57,265 - INFO - Processing document 4_2025-11-07
2025-11-14 16:49:57,286 - INFO - Finished converting document 4_2025-11-07 in 0.05 sec.
2025-11-14 16:49:57,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,371 - INFO - Going to convert document batch...
2025-11-14 16:49:57,372 - INFO - Processing document 8-K_2023-01-05
2025-11-14 16:49:57,410 - INFO - Finished converting document 8-K_2023-01-05 in 0.09 sec.


Converted 'data\edgar_documents\IBM\4_2025-11-05' --> 'data\processed_data\IBM\4_2025-11-05.md'
Converted 'data\edgar_documents\IBM\4_2025-11-07' --> 'data\processed_data\IBM\4_2025-11-07.md'


2025-11-14 16:49:57,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,523 - INFO - Going to convert document batch...
2025-11-14 16:49:57,524 - INFO - Processing document 8-K_2023-01-25
2025-11-14 16:49:57,577 - INFO - Finished converting document 8-K_2023-01-25 in 0.14 sec.


Converted 'data\edgar_documents\IBM\8-K_2023-01-05' --> 'data\processed_data\IBM\8-K_2023-01-05.md'


2025-11-14 16:49:57,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:57,771 - INFO - Going to convert document batch...
2025-11-14 16:49:57,772 - INFO - Processing document 8-K_2023-01-26
2025-11-14 16:49:57,820 - INFO - Finished converting document 8-K_2023-01-26 in 0.12 sec.
2025-11-14 16:49:57,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\8-K_2023-01-25' --> 'data\processed_data\IBM\8-K_2023-01-25.md'
Converted 'data\edgar_documents\IBM\8-K_2023-01-26' --> 'data\processed_data\IBM\8-K_2023-01-26.md'


2025-11-14 16:49:57,930 - INFO - Going to convert document batch...
2025-11-14 16:49:57,932 - INFO - Processing document 8-K_2023-02-03
2025-11-14 16:49:58,009 - INFO - Finished converting document 8-K_2023-02-03 in 0.16 sec.
2025-11-14 16:49:58,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,194 - INFO - Going to convert document batch...
2025-11-14 16:49:58,195 - INFO - Processing document 8-K_2023-04-19
2025-11-14 16:49:58,230 - INFO - Finished converting document 8-K_2023-04-19 in 0.09 sec.
2025-11-14 16:49:58,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,289 - INFO - Going to convert document batch...
2025-11-14 16:49:58,289 - INFO - Processing document 8-K_2023-04-20
2025-11-14 16:49:58,329 - INFO - Finished converting document 8-K_2023-04-20 in 0.08 sec.


Converted 'data\edgar_documents\IBM\8-K_2023-02-03' --> 'data\processed_data\IBM\8-K_2023-02-03.md'
Converted 'data\edgar_documents\IBM\8-K_2023-04-19' --> 'data\processed_data\IBM\8-K_2023-04-19.md'


2025-11-14 16:49:58,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,427 - INFO - Going to convert document batch...
2025-11-14 16:49:58,428 - INFO - Processing document 8-K_2023-04-28
2025-11-14 16:49:58,508 - INFO - Finished converting document 8-K_2023-04-28 in 0.16 sec.


Converted 'data\edgar_documents\IBM\8-K_2023-04-20' --> 'data\processed_data\IBM\8-K_2023-04-20.md'
Converted 'data\edgar_documents\IBM\8-K_2023-04-28' --> 'data\processed_data\IBM\8-K_2023-04-28.md'


2025-11-14 16:49:58,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,640 - INFO - Going to convert document batch...
2025-11-14 16:49:58,641 - INFO - Processing document 8-K_2023-06-16
2025-11-14 16:49:58,718 - INFO - Finished converting document 8-K_2023-06-16 in 0.17 sec.
2025-11-14 16:49:58,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,804 - INFO - Going to convert document batch...
2025-11-14 16:49:58,805 - INFO - Processing document 8-K_2023-07-19
2025-11-14 16:49:58,856 - INFO - Finished converting document 8-K_2023-07-19 in 0.11 sec.
2025-11-14 16:49:58,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:58,935 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\IBM\8-K_2023-06-16' --> 'data\processed_data\IBM\8-K_2023-06-16.md'
Converted 'data\edgar_documents\IBM\8-K_2023-07-19' --> 'data\processed_data\IBM\8-K_2023-07-19.md'


2025-11-14 16:49:58,937 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:49:58,994 - INFO - Finished converting document 8-K_2023-07-20 in 0.11 sec.
2025-11-14 16:49:59,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\8-K_2023-07-20' --> 'data\processed_data\IBM\8-K_2023-07-20.md'


2025-11-14 16:49:59,784 - INFO - Going to convert document batch...
2025-11-14 16:49:59,786 - INFO - Processing document 8-K_2023-07-31
2025-11-14 16:49:59,858 - INFO - Finished converting document 8-K_2023-07-31 in 0.84 sec.
2025-11-14 16:49:59,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:49:59,986 - INFO - Going to convert document batch...
2025-11-14 16:49:59,987 - INFO - Processing document 8-K_2023-10-25
2025-11-14 16:50:00,032 - INFO - Finished converting document 8-K_2023-10-25 in 0.11 sec.
2025-11-14 16:50:00,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\8-K_2023-07-31' --> 'data\processed_data\IBM\8-K_2023-07-31.md'
Converted 'data\edgar_documents\IBM\8-K_2023-10-25' --> 'data\processed_data\IBM\8-K_2023-10-25.md'


2025-11-14 16:50:00,158 - INFO - Going to convert document batch...
2025-11-14 16:50:00,158 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:50:00,198 - INFO - Finished converting document 8-K_2023-10-26 in 0.16 sec.
2025-11-14 16:50:00,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:00,292 - INFO - Going to convert document batch...
2025-11-14 16:50:00,293 - INFO - Processing document 8-K_2023-12-12
2025-11-14 16:50:00,340 - INFO - Finished converting document 8-K_2023-12-12 in 0.12 sec.


Converted 'data\edgar_documents\IBM\8-K_2023-10-26' --> 'data\processed_data\IBM\8-K_2023-10-26.md'
Converted 'data\edgar_documents\IBM\8-K_2023-12-12' --> 'data\processed_data\IBM\8-K_2023-12-12.md'


2025-11-14 16:50:00,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:00,482 - INFO - Going to convert document batch...
2025-11-14 16:50:00,483 - INFO - Processing document 8-K_2024-01-24
2025-11-14 16:50:00,537 - INFO - Finished converting document 8-K_2024-01-24 in 0.16 sec.
2025-11-14 16:50:00,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:00,611 - INFO - Going to convert document batch...
2025-11-14 16:50:00,612 - INFO - Processing document 8-K_2024-01-25
2025-11-14 16:50:00,648 - INFO - Finished converting document 8-K_2024-01-25 in 0.08 sec.
2025-11-14 16:50:00,680 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:50:00,681 - ERROR - Input document 8-K_2024-02-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciid

Converted 'data\edgar_documents\IBM\8-K_2024-01-24' --> 'data\processed_data\IBM\8-K_2024-01-24.md'
Converted 'data\edgar_documents\IBM\8-K_2024-01-25' --> 'data\processed_data\IBM\8-K_2024-01-25.md'
Error processing data\edgar_documents\IBM\8-K_2024-02-01: File format not allowed: data\edgar_documents\IBM\8-K_2024-02-01


2025-11-14 16:50:00,807 - INFO - Finished converting document 8-K_2024-02-02 in 0.11 sec.
2025-11-14 16:50:00,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:00,948 - INFO - Going to convert document batch...
2025-11-14 16:50:00,949 - INFO - Processing document 8-K_2024-02-26
2025-11-14 16:50:00,996 - INFO - Finished converting document 8-K_2024-02-26 in 0.14 sec.


Converted 'data\edgar_documents\IBM\8-K_2024-02-02' --> 'data\processed_data\IBM\8-K_2024-02-02.md'
Converted 'data\edgar_documents\IBM\8-K_2024-02-26' --> 'data\processed_data\IBM\8-K_2024-02-26.md'


2025-11-14 16:50:01,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:01,123 - INFO - Going to convert document batch...
2025-11-14 16:50:01,125 - INFO - Processing document 8-K_2024-03-18
2025-11-14 16:50:01,276 - INFO - Finished converting document 8-K_2024-03-18 in 0.25 sec.
2025-11-14 16:50:01,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:01,358 - INFO - Going to convert document batch...
2025-11-14 16:50:01,360 - INFO - Processing document 8-K_2024-04-24
2025-11-14 16:50:01,418 - INFO - Finished converting document 8-K_2024-04-24 in 0.11 sec.
2025-11-14 16:50:01,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\8-K_2024-03-18' --> 'data\processed_data\IBM\8-K_2024-03-18.md'
Converted 'data\edgar_documents\IBM\8-K_2024-04-24' --> 'data\processed_data\IBM\8-K_2024-04-24.md'


2025-11-14 16:50:01,523 - INFO - Going to convert document batch...
2025-11-14 16:50:01,524 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:50:01,567 - INFO - Finished converting document 8-K_2024-04-25 in 0.12 sec.
2025-11-14 16:50:01,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:01,677 - INFO - Going to convert document batch...
2025-11-14 16:50:01,678 - INFO - Processing document 8-K_2024-05-03
2025-11-14 16:50:01,751 - INFO - Finished converting document 8-K_2024-05-03 in 0.17 sec.


Converted 'data\edgar_documents\IBM\8-K_2024-04-25' --> 'data\processed_data\IBM\8-K_2024-04-25.md'


2025-11-14 16:50:01,842 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:50:01,843 - ERROR - Input document 8-K_2024-06-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:50:01,844 - INFO - Going to convert document batch...
2025-11-14 16:50:01,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:01,880 - INFO - Going to convert document batch...
2025-11-14 16:50:01,880 - INFO - Processing document 8-K_2024-07

Converted 'data\edgar_documents\IBM\8-K_2024-05-03' --> 'data\processed_data\IBM\8-K_2024-05-03.md'
Error processing data\edgar_documents\IBM\8-K_2024-06-21: File format not allowed: data\edgar_documents\IBM\8-K_2024-06-21


2025-11-14 16:50:02,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:02,102 - INFO - Going to convert document batch...
2025-11-14 16:50:02,103 - INFO - Processing document 8-K_2024-07-25
2025-11-14 16:50:02,142 - INFO - Finished converting document 8-K_2024-07-25 in 0.12 sec.
2025-11-14 16:50:02,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:02,215 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\IBM\8-K_2024-07-24' --> 'data\processed_data\IBM\8-K_2024-07-24.md'
Converted 'data\edgar_documents\IBM\8-K_2024-07-25' --> 'data\processed_data\IBM\8-K_2024-07-25.md'


2025-11-14 16:50:02,216 - INFO - Processing document 8-K_2024-09-11
2025-11-14 16:50:02,272 - INFO - Finished converting document 8-K_2024-09-11 in 0.11 sec.
2025-11-14 16:50:02,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:02,392 - INFO - Going to convert document batch...
2025-11-14 16:50:02,393 - INFO - Processing document 8-K_2024-10-23
2025-11-14 16:50:02,429 - INFO - Finished converting document 8-K_2024-10-23 in 0.12 sec.


Converted 'data\edgar_documents\IBM\8-K_2024-09-11' --> 'data\processed_data\IBM\8-K_2024-09-11.md'
Converted 'data\edgar_documents\IBM\8-K_2024-10-23' --> 'data\processed_data\IBM\8-K_2024-10-23.md'


2025-11-14 16:50:02,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:02,800 - INFO - Going to convert document batch...
2025-11-14 16:50:02,805 - INFO - Processing document 8-K_2024-10-24
2025-11-14 16:50:02,844 - INFO - Finished converting document 8-K_2024-10-24 in 0.39 sec.
2025-11-14 16:50:02,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:02,945 - INFO - Going to convert document batch...
2025-11-14 16:50:02,945 - INFO - Processing document 8-K_2024-12-09
2025-11-14 16:50:02,978 - INFO - Finished converting document 8-K_2024-12-09 in 0.08 sec.
2025-11-14 16:50:03,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:03,039 - INFO - Going to convert document batch...
2025-11-14 16:50:03,041 - INFO - Processing document 8-K_2025-01-29
2025-11-14 16:50:03,072 - INFO - Finished converting document 8-K_2025-01-29 in 0.06 sec.


Converted 'data\edgar_documents\IBM\8-K_2024-10-24' --> 'data\processed_data\IBM\8-K_2024-10-24.md'
Converted 'data\edgar_documents\IBM\8-K_2024-12-09' --> 'data\processed_data\IBM\8-K_2024-12-09.md'


2025-11-14 16:50:03,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:03,217 - INFO - Going to convert document batch...
2025-11-14 16:50:03,219 - INFO - Processing document 8-K_2025-01-30
2025-11-14 16:50:03,269 - INFO - Finished converting document 8-K_2025-01-30 in 0.19 sec.


Converted 'data\edgar_documents\IBM\8-K_2025-01-29' --> 'data\processed_data\IBM\8-K_2025-01-29.md'


2025-11-14 16:50:03,309 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:03,332 - INFO - Going to convert document batch...
2025-11-14 16:50:03,333 - INFO - Processing document 8-K_2025-02-04
2025-11-14 16:50:03,374 - INFO - Finished converting document 8-K_2025-02-04 in 0.08 sec.
2025-11-14 16:50:03,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:03,464 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\IBM\8-K_2025-01-30' --> 'data\processed_data\IBM\8-K_2025-01-30.md'
Converted 'data\edgar_documents\IBM\8-K_2025-02-04' --> 'data\processed_data\IBM\8-K_2025-02-04.md'


2025-11-14 16:50:03,465 - INFO - Processing document 8-K_2025-02-07
2025-11-14 16:50:03,563 - INFO - Finished converting document 8-K_2025-02-07 in 0.16 sec.
2025-11-14 16:50:03,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:03,679 - INFO - Going to convert document batch...
2025-11-14 16:50:03,679 - INFO - Processing document 8-K_2025-03-12


Converted 'data\edgar_documents\IBM\8-K_2025-02-07' --> 'data\processed_data\IBM\8-K_2025-02-07.md'


2025-11-14 16:50:03,952 - INFO - Finished converting document 8-K_2025-03-12 in 0.36 sec.
2025-11-14 16:50:03,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,024 - INFO - Going to convert document batch...
2025-11-14 16:50:04,025 - INFO - Processing document 8-K_2025-04-23
2025-11-14 16:50:04,061 - INFO - Finished converting document 8-K_2025-04-23 in 0.09 sec.
2025-11-14 16:50:04,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,114 - INFO - Going to convert document batch...
2025-11-14 16:50:04,115 - INFO - Processing document 8-K_2025-04-24
2025-11-14 16:50:04,150 - INFO - Finished converting document 8-K_2025-04-24 in 0.06 sec.


Converted 'data\edgar_documents\IBM\8-K_2025-03-12' --> 'data\processed_data\IBM\8-K_2025-03-12.md'
Converted 'data\edgar_documents\IBM\8-K_2025-04-23' --> 'data\processed_data\IBM\8-K_2025-04-23.md'
Converted 'data\edgar_documents\IBM\8-K_2025-04-24' --> 'data\processed_data\IBM\8-K_2025-04-24.md'


2025-11-14 16:50:04,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,227 - INFO - Going to convert document batch...
2025-11-14 16:50:04,228 - INFO - Processing document 8-K_2025-04-29
2025-11-14 16:50:04,263 - INFO - Finished converting document 8-K_2025-04-29 in 0.09 sec.
2025-11-14 16:50:04,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,345 - INFO - Going to convert document batch...
2025-11-14 16:50:04,346 - INFO - Processing document 8-K_2025-05-02
2025-11-14 16:50:04,416 - INFO - Finished converting document 8-K_2025-05-02 in 0.14 sec.


Converted 'data\edgar_documents\IBM\8-K_2025-04-29' --> 'data\processed_data\IBM\8-K_2025-04-29.md'
Converted 'data\edgar_documents\IBM\8-K_2025-05-02' --> 'data\processed_data\IBM\8-K_2025-05-02.md'


2025-11-14 16:50:04,528 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:50:04,529 - ERROR - Input document 8-K_2025-06-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:50:04,530 - INFO - Going to convert document batch...
2025-11-14 16:50:04,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,571 - INFO - Going to convert document batch...
2025-11-14 16:50:04,571 - INFO - Processing document 8-K_2025-07

Error processing data\edgar_documents\IBM\8-K_2025-06-20: File format not allowed: data\edgar_documents\IBM\8-K_2025-06-20
Converted 'data\edgar_documents\IBM\8-K_2025-07-23' --> 'data\processed_data\IBM\8-K_2025-07-23.md'


2025-11-14 16:50:04,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:50:04,792 - INFO - Going to convert document batch...
2025-11-14 16:50:04,794 - INFO - Processing document 8-K_2025-10-22
2025-11-14 16:50:04,844 - INFO - Finished converting document 8-K_2025-10-22 in 0.09 sec.
2025-11-14 16:50:04,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\IBM\8-K_2025-07-24' --> 'data\processed_data\IBM\8-K_2025-07-24.md'
Converted 'data\edgar_documents\IBM\8-K_2025-10-22' --> 'data\processed_data\IBM\8-K_2025-10-22.md'


2025-11-14 16:50:04,974 - INFO - Going to convert document batch...
2025-11-14 16:50:04,975 - INFO - Processing document 8-K_2025-10-23
2025-11-14 16:50:05,018 - INFO - Finished converting document 8-K_2025-10-23 in 0.14 sec.
2025-11-14 16:50:05,141 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:50:05,142 - ERROR - Input document DEF-14A_2023-03-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:50:05,146 - INFO - Going to convert 

Converted 'data\edgar_documents\IBM\8-K_2025-10-23' --> 'data\processed_data\IBM\8-K_2025-10-23.md'
Error processing data\edgar_documents\IBM\DEF-14A_2023-03-06: File format not allowed: data\edgar_documents\IBM\DEF-14A_2023-03-06


2025-11-14 16:50:06,374 - INFO - Going to convert document batch...
2025-11-14 16:50:06,377 - INFO - Processing document DEF-14A_2024-03-11
2025-11-14 16:50:15,694 - INFO - Finished converting document DEF-14A_2024-03-11 in 10.55 sec.
2025-11-14 16:50:16,969 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\IBM\DEF-14A_2024-03-11' --> 'data\processed_data\IBM\DEF-14A_2024-03-11.md'


2025-11-14 16:50:16,970 - ERROR - Input document DEF-14A_2025-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:50:16,974 - INFO - Going to convert document batch...
2025-11-14 16:50:17,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\IBM\DEF-14A_2025-03-10: File format not allowed: data\edgar_documents\IBM\DEF-14A_2025-03-10
Processed 103 new files. Errors: 13
Found 133 files to process in data\edgar_documents\INTC


2025-11-14 16:50:18,209 - INFO - Going to convert document batch...
2025-11-14 16:50:18,209 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:50:18,211 - INFO - Processing document 10-K_2023-01-27
2025-11-14 16:50:22,042 - INFO - Finished converting document 10-K_2023-01-27 in 5.05 sec.
2025-11-14 16:50:23,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-K_2023-01-27' --> 'data\processed_data\INTC\10-K_2023-01-27.md'


2025-11-14 16:50:25,005 - INFO - Going to convert document batch...
2025-11-14 16:50:25,006 - INFO - Processing document 10-K_2024-01-26
2025-11-14 16:50:28,301 - INFO - Finished converting document 10-K_2024-01-26 in 5.03 sec.
2025-11-14 16:50:29,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-K_2024-01-26' --> 'data\processed_data\INTC\10-K_2024-01-26.md'


2025-11-14 16:50:31,555 - INFO - Going to convert document batch...
2025-11-14 16:50:31,556 - INFO - Processing document 10-K_2025-01-31
2025-11-14 16:50:34,717 - INFO - Finished converting document 10-K_2025-01-31 in 4.95 sec.
2025-11-14 16:50:35,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-K_2025-01-31' --> 'data\processed_data\INTC\10-K_2025-01-31.md'


2025-11-14 16:50:36,492 - INFO - Going to convert document batch...
2025-11-14 16:50:36,493 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 16:50:37,435 - INFO - Finished converting document 10-Q_2023-04-28 in 1.67 sec.
2025-11-14 16:50:38,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2023-04-28' --> 'data\processed_data\INTC\10-Q_2023-04-28.md'


2025-11-14 16:50:39,331 - INFO - Going to convert document batch...
2025-11-14 16:50:39,331 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 16:50:40,546 - INFO - Finished converting document 10-Q_2023-07-28 in 2.53 sec.
2025-11-14 16:50:41,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2023-07-28' --> 'data\processed_data\INTC\10-Q_2023-07-28.md'


2025-11-14 16:50:42,385 - INFO - Going to convert document batch...
2025-11-14 16:50:42,386 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 16:50:43,533 - INFO - Finished converting document 10-Q_2023-10-27 in 2.22 sec.
2025-11-14 16:50:44,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2023-10-27' --> 'data\processed_data\INTC\10-Q_2023-10-27.md'


2025-11-14 16:50:44,989 - INFO - Going to convert document batch...
2025-11-14 16:50:44,990 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 16:50:46,546 - INFO - Finished converting document 10-Q_2024-04-26 in 2.17 sec.
2025-11-14 16:50:47,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2024-04-26' --> 'data\processed_data\INTC\10-Q_2024-04-26.md'


2025-11-14 16:50:47,769 - INFO - Going to convert document batch...
2025-11-14 16:50:47,770 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 16:50:49,108 - INFO - Finished converting document 10-Q_2024-08-02 in 1.95 sec.
2025-11-14 16:50:49,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2024-08-02' --> 'data\processed_data\INTC\10-Q_2024-08-02.md'


2025-11-14 16:50:51,038 - INFO - Going to convert document batch...
2025-11-14 16:50:51,038 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 16:50:52,421 - INFO - Finished converting document 10-Q_2024-11-01 in 2.62 sec.
2025-11-14 16:50:53,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2024-11-01' --> 'data\processed_data\INTC\10-Q_2024-11-01.md'


2025-11-14 16:50:53,981 - INFO - Going to convert document batch...
2025-11-14 16:50:53,982 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 16:50:54,890 - INFO - Finished converting document 10-Q_2025-04-25 in 1.77 sec.
2025-11-14 16:50:55,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2025-04-25' --> 'data\processed_data\INTC\10-Q_2025-04-25.md'


2025-11-14 16:50:56,153 - INFO - Going to convert document batch...
2025-11-14 16:50:56,154 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:50:57,297 - INFO - Finished converting document 10-Q_2025-07-24 in 1.67 sec.
2025-11-14 16:50:58,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2025-07-24' --> 'data\processed_data\INTC\10-Q_2025-07-24.md'


2025-11-14 16:50:59,054 - INFO - Going to convert document batch...
2025-11-14 16:50:59,055 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 16:51:00,152 - INFO - Finished converting document 10-Q_2025-11-06 in 2.03 sec.
2025-11-14 16:51:01,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:01,193 - INFO - Going to convert document batch...
2025-11-14 16:51:01,194 - INFO - Processing document 4_2023-01-04
2025-11-14 16:51:01,216 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 16:51:01,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:01,269 - INFO - Going to convert document batch...
2025-11-14 16:51:01,270 - INFO - Processing document 4_2023-02-01
2025-11-14 16:51:01,297 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 16:51:01,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\10-Q_2025-11-06' --> 'data\processed_data\INTC\10-Q_2025-11-06.md'
Converted 'data\edgar_documents\INTC\4_2023-01-04' --> 'data\processed_data\INTC\4_2023-01-04.md'
Converted 'data\edgar_documents\INTC\4_2023-02-01' --> 'data\processed_data\INTC\4_2023-02-01.md'


2025-11-14 16:51:01,362 - INFO - Going to convert document batch...
2025-11-14 16:51:01,363 - INFO - Processing document 4_2023-02-02
2025-11-14 16:51:01,405 - INFO - Finished converting document 4_2023-02-02 in 0.09 sec.
2025-11-14 16:51:01,496 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:51:01,497 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:51:01,500 - INFO - Going to convert document batch...
2025-11-14 16:51:01,520 - IN

Converted 'data\edgar_documents\INTC\4_2023-02-02' --> 'data\processed_data\INTC\4_2023-02-02.md'
Error processing data\edgar_documents\INTC\4_2023-02-07: File format not allowed: data\edgar_documents\INTC\4_2023-02-07
Error processing data\edgar_documents\INTC\4_2023-02-08: File format not allowed: data\edgar_documents\INTC\4_2023-02-08
Converted 'data\edgar_documents\INTC\4_2023-02-17' --> 'data\processed_data\INTC\4_2023-02-17.md'


2025-11-14 16:51:01,629 - INFO - Processing document 4_2023-02-23
2025-11-14 16:51:01,655 - INFO - Finished converting document 4_2023-02-23 in 0.06 sec.
2025-11-14 16:51:01,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:01,701 - INFO - Going to convert document batch...
2025-11-14 16:51:01,702 - INFO - Processing document 4_2023-02-24
2025-11-14 16:51:01,742 - INFO - Finished converting document 4_2023-02-24 in 0.06 sec.
2025-11-14 16:51:01,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:01,788 - INFO - Going to convert document batch...
2025-11-14 16:51:01,789 - INFO - Processing document 4_2023-03-24
2025-11-14 16:51:01,816 - INFO - Finished converting document 4_2023-03-24 in 0.05 sec.
2025-11-14 16:51:01,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2023-02-23' --> 'data\processed_data\INTC\4_2023-02-23.md'
Converted 'data\edgar_documents\INTC\4_2023-02-24' --> 'data\processed_data\INTC\4_2023-02-24.md'
Converted 'data\edgar_documents\INTC\4_2023-03-24' --> 'data\processed_data\INTC\4_2023-03-24.md'


2025-11-14 16:51:01,869 - INFO - Going to convert document batch...
2025-11-14 16:51:01,870 - INFO - Processing document 4_2023-04-03
2025-11-14 16:51:01,895 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 16:51:01,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:01,977 - INFO - Going to convert document batch...
2025-11-14 16:51:01,978 - INFO - Processing document 4_2023-05-03
2025-11-14 16:51:02,002 - INFO - Finished converting document 4_2023-05-03 in 0.06 sec.
2025-11-14 16:51:02,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,053 - INFO - Going to convert document batch...
2025-11-14 16:51:02,054 - INFO - Processing document 4_2023-05-15
2025-11-14 16:51:02,076 - INFO - Finished converting document 4_2023-05-15 in 0.05 sec.
2025-11-14 16:51:02,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2023-04-03' --> 'data\processed_data\INTC\4_2023-04-03.md'
Converted 'data\edgar_documents\INTC\4_2023-05-03' --> 'data\processed_data\INTC\4_2023-05-03.md'
Converted 'data\edgar_documents\INTC\4_2023-05-15' --> 'data\processed_data\INTC\4_2023-05-15.md'


2025-11-14 16:51:02,135 - INFO - Going to convert document batch...
2025-11-14 16:51:02,136 - INFO - Processing document 4_2023-05-17
2025-11-14 16:51:02,169 - INFO - Finished converting document 4_2023-05-17 in 0.06 sec.
2025-11-14 16:51:02,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,229 - INFO - Going to convert document batch...
2025-11-14 16:51:02,229 - INFO - Processing document 4_2023-06-01
2025-11-14 16:51:02,254 - INFO - Finished converting document 4_2023-06-01 in 0.05 sec.
2025-11-14 16:51:02,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,313 - INFO - Going to convert document batch...
2025-11-14 16:51:02,313 - INFO - Processing document 4_2023-06-14
2025-11-14 16:51:02,339 - INFO - Finished converting document 4_2023-06-14 in 0.06 sec.
2025-11-14 16:51:02,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,394 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2023-05-17' --> 'data\processed_data\INTC\4_2023-05-17.md'
Converted 'data\edgar_documents\INTC\4_2023-06-01' --> 'data\processed_data\INTC\4_2023-06-01.md'
Converted 'data\edgar_documents\INTC\4_2023-06-14' --> 'data\processed_data\INTC\4_2023-06-14.md'


2025-11-14 16:51:02,397 - INFO - Processing document 4_2023-06-26
2025-11-14 16:51:02,432 - INFO - Finished converting document 4_2023-06-26 in 0.08 sec.
2025-11-14 16:51:02,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,631 - INFO - Going to convert document batch...
2025-11-14 16:51:02,632 - INFO - Processing document 4_2023-07-05
2025-11-14 16:51:02,667 - INFO - Finished converting document 4_2023-07-05 in 0.11 sec.
2025-11-14 16:51:02,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:02,732 - INFO - Going to convert document batch...
2025-11-14 16:51:02,734 - INFO - Processing document 4_2023-08-02


Converted 'data\edgar_documents\INTC\4_2023-06-26' --> 'data\processed_data\INTC\4_2023-06-26.md'
Converted 'data\edgar_documents\INTC\4_2023-07-05' --> 'data\processed_data\INTC\4_2023-07-05.md'


2025-11-14 16:51:03,212 - INFO - Finished converting document 4_2023-08-02 in 0.50 sec.
2025-11-14 16:51:03,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:03,306 - INFO - Going to convert document batch...
2025-11-14 16:51:03,307 - INFO - Processing document 4_2023-08-04
2025-11-14 16:51:03,336 - INFO - Finished converting document 4_2023-08-04 in 0.08 sec.
2025-11-14 16:51:03,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:03,385 - INFO - Going to convert document batch...
2025-11-14 16:51:03,386 - INFO - Processing document 4_2023-08-10
2025-11-14 16:51:03,405 - INFO - Finished converting document 4_2023-08-10 in 0.05 sec.
2025-11-14 16:51:03,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2023-08-02' --> 'data\processed_data\INTC\4_2023-08-02.md'
Converted 'data\edgar_documents\INTC\4_2023-08-04' --> 'data\processed_data\INTC\4_2023-08-04.md'
Converted 'data\edgar_documents\INTC\4_2023-08-10' --> 'data\processed_data\INTC\4_2023-08-10.md'


2025-11-14 16:51:03,453 - INFO - Going to convert document batch...
2025-11-14 16:51:03,453 - INFO - Processing document 4_2023-08-17
2025-11-14 16:51:03,578 - INFO - Finished converting document 4_2023-08-17 in 0.16 sec.
2025-11-14 16:51:03,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:03,682 - INFO - Going to convert document batch...
2025-11-14 16:51:03,683 - INFO - Processing document 4_2023-08-23
2025-11-14 16:51:03,703 - INFO - Finished converting document 4_2023-08-23 in 0.08 sec.
2025-11-14 16:51:03,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:03,747 - INFO - Going to convert document batch...
2025-11-14 16:51:03,748 - INFO - Processing document 4_2023-09-01
2025-11-14 16:51:03,773 - INFO - Finished converting document 4_2023-09-01 in 0.05 sec.
2025-11-14 16:51:03,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2023-08-17' --> 'data\processed_data\INTC\4_2023-08-17.md'
Converted 'data\edgar_documents\INTC\4_2023-08-23' --> 'data\processed_data\INTC\4_2023-08-23.md'
Converted 'data\edgar_documents\INTC\4_2023-09-01' --> 'data\processed_data\INTC\4_2023-09-01.md'


2025-11-14 16:51:03,841 - INFO - Going to convert document batch...
2025-11-14 16:51:03,842 - INFO - Processing document 4_2023-09-26
2025-11-14 16:51:03,878 - INFO - Finished converting document 4_2023-09-26 in 0.08 sec.
2025-11-14 16:51:03,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:03,993 - INFO - Going to convert document batch...
2025-11-14 16:51:03,994 - INFO - Processing document 4_2023-10-03
2025-11-14 16:51:04,013 - INFO - Finished converting document 4_2023-10-03 in 0.09 sec.
2025-11-14 16:51:04,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,066 - INFO - Going to convert document batch...
2025-11-14 16:51:04,067 - INFO - Processing document 4_2023-11-01
2025-11-14 16:51:04,088 - INFO - Finished converting document 4_2023-11-01 in 0.05 sec.


Converted 'data\edgar_documents\INTC\4_2023-09-26' --> 'data\processed_data\INTC\4_2023-09-26.md'
Converted 'data\edgar_documents\INTC\4_2023-10-03' --> 'data\processed_data\INTC\4_2023-10-03.md'
Converted 'data\edgar_documents\INTC\4_2023-11-01' --> 'data\processed_data\INTC\4_2023-11-01.md'


2025-11-14 16:51:04,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,139 - INFO - Going to convert document batch...
2025-11-14 16:51:04,140 - INFO - Processing document 4_2023-11-02
2025-11-14 16:51:04,174 - INFO - Finished converting document 4_2023-11-02 in 0.06 sec.
2025-11-14 16:51:04,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,227 - INFO - Going to convert document batch...
2025-11-14 16:51:04,227 - INFO - Processing document 4_2023-11-14
2025-11-14 16:51:04,247 - INFO - Finished converting document 4_2023-11-14 in 0.05 sec.
2025-11-14 16:51:04,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,299 - INFO - Going to convert document batch...
2025-11-14 16:51:04,300 - INFO - Processing document 4_2023-11-17
2025-11-14 16:51:04,327 - INFO - Finished converting document 4_2023-11-17 in 0.06 sec.
2025-11-14 16:51:04,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\INTC\4_2023-11-02' --> 'data\processed_data\INTC\4_2023-11-02.md'
Converted 'data\edgar_documents\INTC\4_2023-11-14' --> 'data\processed_data\INTC\4_2023-11-14.md'
Converted 'data\edgar_documents\INTC\4_2023-11-17' --> 'data\processed_data\INTC\4_2023-11-17.md'


2025-11-14 16:51:04,394 - INFO - Finished converting document 4_2023-12-04 in 0.05 sec.
2025-11-14 16:51:04,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,453 - INFO - Going to convert document batch...
2025-11-14 16:51:04,454 - INFO - Processing document 4_2023-12-05
2025-11-14 16:51:04,477 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 16:51:04,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,625 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2023-12-04' --> 'data\processed_data\INTC\4_2023-12-04.md'
Converted 'data\edgar_documents\INTC\4_2023-12-05' --> 'data\processed_data\INTC\4_2023-12-05.md'


2025-11-14 16:51:04,627 - INFO - Processing document 4_2023-12-27
2025-11-14 16:51:04,668 - INFO - Finished converting document 4_2023-12-27 in 0.16 sec.
2025-11-14 16:51:04,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,723 - INFO - Going to convert document batch...
2025-11-14 16:51:04,724 - INFO - Processing document 4_2024-01-03
2025-11-14 16:51:04,744 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 16:51:04,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,822 - INFO - Going to convert document batch...
2025-11-14 16:51:04,823 - INFO - Processing document 4_2024-01-30
2025-11-14 16:51:04,855 - INFO - Finished converting document 4_2024-01-30 in 0.09 sec.


Converted 'data\edgar_documents\INTC\4_2023-12-27' --> 'data\processed_data\INTC\4_2023-12-27.md'
Converted 'data\edgar_documents\INTC\4_2024-01-03' --> 'data\processed_data\INTC\4_2024-01-03.md'
Converted 'data\edgar_documents\INTC\4_2024-01-30' --> 'data\processed_data\INTC\4_2024-01-30.md'


2025-11-14 16:51:04,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:04,966 - INFO - Going to convert document batch...
2025-11-14 16:51:04,967 - INFO - Processing document 4_2024-02-01
2025-11-14 16:51:04,999 - INFO - Finished converting document 4_2024-02-01 in 0.12 sec.
2025-11-14 16:51:05,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:05,154 - INFO - Going to convert document batch...
2025-11-14 16:51:05,155 - INFO - Processing document 4_2024-02-02
2025-11-14 16:51:05,188 - INFO - Finished converting document 4_2024-02-02 in 0.09 sec.
2025-11-14 16:51:05,232 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:51:05,233 - ERROR - Input document 4_2024-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\INTC\4_2024-02-01' --> 'data\processed_data\INTC\4_2024-02-01.md'
Converted 'data\edgar_documents\INTC\4_2024-02-02' --> 'data\processed_data\INTC\4_2024-02-02.md'
Error processing data\edgar_documents\INTC\4_2024-02-15: File format not allowed: data\edgar_documents\INTC\4_2024-02-15
Error processing data\edgar_documents\INTC\4_2024-02-16: File format not allowed: data\edgar_documents\INTC\4_2024-02-16


2025-11-14 16:51:05,290 - INFO - Processing document 4_2024-02-20
2025-11-14 16:51:05,327 - INFO - Finished converting document 4_2024-02-20 in 0.08 sec.


Converted 'data\edgar_documents\INTC\4_2024-02-20' --> 'data\processed_data\INTC\4_2024-02-20.md'


2025-11-14 16:51:05,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:05,692 - INFO - Going to convert document batch...
2025-11-14 16:51:05,693 - INFO - Processing document 4_2024-03-04
2025-11-14 16:51:05,722 - INFO - Finished converting document 4_2024-03-04 in 0.34 sec.
2025-11-14 16:51:05,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:05,778 - INFO - Going to convert document batch...
2025-11-14 16:51:05,779 - INFO - Processing document 4_2024-03-26
2025-11-14 16:51:05,806 - INFO - Finished converting document 4_2024-03-26 in 0.05 sec.
2025-11-14 16:51:05,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:05,854 - INFO - Going to convert document batch...
2025-11-14 16:51:05,856 - INFO - Processing document 4_2024-04-02
2025-11-14 16:51:05,877 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 16:51:05,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\INTC\4_2024-03-04' --> 'data\processed_data\INTC\4_2024-03-04.md'
Converted 'data\edgar_documents\INTC\4_2024-03-26' --> 'data\processed_data\INTC\4_2024-03-26.md'
Converted 'data\edgar_documents\INTC\4_2024-04-02' --> 'data\processed_data\INTC\4_2024-04-02.md'


2025-11-14 16:51:05,952 - INFO - Finished converting document 4_2024-05-01 in 0.05 sec.
2025-11-14 16:51:05,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,001 - INFO - Going to convert document batch...
2025-11-14 16:51:06,003 - INFO - Processing document 4_2024-05-02
2025-11-14 16:51:06,030 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 16:51:06,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,085 - INFO - Going to convert document batch...
2025-11-14 16:51:06,085 - INFO - Processing document 4_2024-05-09
2025-11-14 16:51:06,133 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.


Converted 'data\edgar_documents\INTC\4_2024-05-01' --> 'data\processed_data\INTC\4_2024-05-01.md'
Converted 'data\edgar_documents\INTC\4_2024-05-02' --> 'data\processed_data\INTC\4_2024-05-02.md'
Converted 'data\edgar_documents\INTC\4_2024-05-09' --> 'data\processed_data\INTC\4_2024-05-09.md'


2025-11-14 16:51:06,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,189 - INFO - Going to convert document batch...
2025-11-14 16:51:06,189 - INFO - Processing document 4_2024-05-10
2025-11-14 16:51:06,226 - INFO - Finished converting document 4_2024-05-10 in 0.06 sec.
2025-11-14 16:51:06,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,273 - INFO - Going to convert document batch...
2025-11-14 16:51:06,274 - INFO - Processing document 4_2024-06-03
2025-11-14 16:51:06,294 - INFO - Finished converting document 4_2024-06-03 in 0.05 sec.
2025-11-14 16:51:06,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,338 - INFO - Going to convert document batch...
2025-11-14 16:51:06,339 - INFO - Processing document 4_2024-07-02
2025-11-14 16:51:06,360 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 16:51:06,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\INTC\4_2024-05-10' --> 'data\processed_data\INTC\4_2024-05-10.md'
Converted 'data\edgar_documents\INTC\4_2024-06-03' --> 'data\processed_data\INTC\4_2024-06-03.md'
Converted 'data\edgar_documents\INTC\4_2024-07-02' --> 'data\processed_data\INTC\4_2024-07-02.md'


2025-11-14 16:51:06,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,488 - INFO - Going to convert document batch...
2025-11-14 16:51:06,489 - INFO - Processing document 4_2024-08-02
2025-11-14 16:51:06,512 - INFO - Finished converting document 4_2024-08-02 in 0.06 sec.
2025-11-14 16:51:06,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,576 - INFO - Going to convert document batch...
2025-11-14 16:51:06,577 - INFO - Processing document 4_2024-08-07
2025-11-14 16:51:06,607 - INFO - Finished converting document 4_2024-08-07 in 0.08 sec.
2025-11-14 16:51:06,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2024-08-01' --> 'data\processed_data\INTC\4_2024-08-01.md'
Converted 'data\edgar_documents\INTC\4_2024-08-02' --> 'data\processed_data\INTC\4_2024-08-02.md'
Converted 'data\edgar_documents\INTC\4_2024-08-07' --> 'data\processed_data\INTC\4_2024-08-07.md'


2025-11-14 16:51:06,664 - INFO - Going to convert document batch...
2025-11-14 16:51:06,665 - INFO - Processing document 4_2024-09-04
2025-11-14 16:51:06,701 - INFO - Finished converting document 4_2024-09-04 in 0.08 sec.
2025-11-14 16:51:06,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,768 - INFO - Going to convert document batch...
2025-11-14 16:51:06,769 - INFO - Processing document 4_2024-10-01
2025-11-14 16:51:06,789 - INFO - Finished converting document 4_2024-10-01 in 0.05 sec.
2025-11-14 16:51:06,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,836 - INFO - Going to convert document batch...
2025-11-14 16:51:06,837 - INFO - Processing document 4_2024-11-01
2025-11-14 16:51:06,859 - INFO - Finished converting document 4_2024-11-01 in 0.05 sec.
2025-11-14 16:51:06,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:06,929 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2024-09-04' --> 'data\processed_data\INTC\4_2024-09-04.md'
Converted 'data\edgar_documents\INTC\4_2024-10-01' --> 'data\processed_data\INTC\4_2024-10-01.md'
Converted 'data\edgar_documents\INTC\4_2024-11-01' --> 'data\processed_data\INTC\4_2024-11-01.md'


2025-11-14 16:51:06,931 - INFO - Processing document 4_2024-11-06
2025-11-14 16:51:06,958 - INFO - Finished converting document 4_2024-11-06 in 0.06 sec.
2025-11-14 16:51:07,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,021 - INFO - Going to convert document batch...
2025-11-14 16:51:07,022 - INFO - Processing document 4_2024-11-08
2025-11-14 16:51:07,040 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 16:51:07,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,088 - INFO - Going to convert document batch...
2025-11-14 16:51:07,089 - INFO - Processing document 4_2024-12-04
2025-11-14 16:51:07,109 - INFO - Finished converting document 4_2024-12-04 in 0.05 sec.
2025-11-14 16:51:07,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,173 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2024-11-06' --> 'data\processed_data\INTC\4_2024-11-06.md'
Converted 'data\edgar_documents\INTC\4_2024-11-08' --> 'data\processed_data\INTC\4_2024-11-08.md'
Converted 'data\edgar_documents\INTC\4_2024-12-04' --> 'data\processed_data\INTC\4_2024-12-04.md'


2025-11-14 16:51:07,174 - INFO - Processing document 4_2024-12-05
2025-11-14 16:51:07,199 - INFO - Finished converting document 4_2024-12-05 in 0.06 sec.
2025-11-14 16:51:07,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,257 - INFO - Going to convert document batch...
2025-11-14 16:51:07,258 - INFO - Processing document 4_2024-12-31
2025-11-14 16:51:07,281 - INFO - Finished converting document 4_2024-12-31 in 0.05 sec.
2025-11-14 16:51:07,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,329 - INFO - Going to convert document batch...
2025-11-14 16:51:07,331 - INFO - Processing document 4_2025-02-03
2025-11-14 16:51:07,360 - INFO - Finished converting document 4_2025-02-03 in 0.06 sec.
2025-11-14 16:51:07,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,418 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2024-12-05' --> 'data\processed_data\INTC\4_2024-12-05.md'
Converted 'data\edgar_documents\INTC\4_2024-12-31' --> 'data\processed_data\INTC\4_2024-12-31.md'
Converted 'data\edgar_documents\INTC\4_2025-02-03' --> 'data\processed_data\INTC\4_2025-02-03.md'


2025-11-14 16:51:07,419 - INFO - Processing document 4_2025-03-03
2025-11-14 16:51:07,463 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.
2025-11-14 16:51:07,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,547 - INFO - Going to convert document batch...
2025-11-14 16:51:07,550 - INFO - Processing document 4_2025-03-20
2025-11-14 16:51:07,588 - INFO - Finished converting document 4_2025-03-20 in 0.08 sec.
2025-11-14 16:51:07,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2025-03-03' --> 'data\processed_data\INTC\4_2025-03-03.md'
Converted 'data\edgar_documents\INTC\4_2025-03-20' --> 'data\processed_data\INTC\4_2025-03-20.md'


2025-11-14 16:51:07,691 - INFO - Going to convert document batch...
2025-11-14 16:51:07,691 - INFO - Processing document 4_2025-03-25
2025-11-14 16:51:07,724 - INFO - Finished converting document 4_2025-03-25 in 0.11 sec.
2025-11-14 16:51:07,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,784 - INFO - Going to convert document batch...
2025-11-14 16:51:07,785 - INFO - Processing document 4_2025-04-01
2025-11-14 16:51:07,807 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 16:51:07,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,855 - INFO - Going to convert document batch...
2025-11-14 16:51:07,855 - INFO - Processing document 4_2025-05-02
2025-11-14 16:51:07,884 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 16:51:07,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:07,939 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTC\4_2025-03-25' --> 'data\processed_data\INTC\4_2025-03-25.md'
Converted 'data\edgar_documents\INTC\4_2025-04-01' --> 'data\processed_data\INTC\4_2025-04-01.md'
Converted 'data\edgar_documents\INTC\4_2025-05-02' --> 'data\processed_data\INTC\4_2025-05-02.md'


2025-11-14 16:51:07,940 - INFO - Processing document 4_2025-05-08
2025-11-14 16:51:07,979 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.
2025-11-14 16:51:08,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:08,030 - INFO - Going to convert document batch...
2025-11-14 16:51:08,031 - INFO - Processing document 4_2025-06-03
2025-11-14 16:51:08,057 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 16:51:08,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:08,105 - INFO - Going to convert document batch...
2025-11-14 16:51:08,106 - INFO - Processing document 4_2025-07-14
2025-11-14 16:51:08,133 - INFO - Finished converting document 4_2025-07-14 in 0.05 sec.


Converted 'data\edgar_documents\INTC\4_2025-05-08' --> 'data\processed_data\INTC\4_2025-05-08.md'
Converted 'data\edgar_documents\INTC\4_2025-06-03' --> 'data\processed_data\INTC\4_2025-06-03.md'


2025-11-14 16:51:08,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:08,289 - INFO - Going to convert document batch...
2025-11-14 16:51:08,290 - INFO - Processing document 4_2025-08-01
2025-11-14 16:51:08,319 - INFO - Finished converting document 4_2025-08-01 in 0.09 sec.
2025-11-14 16:51:08,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\4_2025-07-14' --> 'data\processed_data\INTC\4_2025-07-14.md'
Converted 'data\edgar_documents\INTC\4_2025-08-01' --> 'data\processed_data\INTC\4_2025-08-01.md'


2025-11-14 16:51:08,656 - INFO - Going to convert document batch...
2025-11-14 16:51:08,657 - INFO - Processing document 4_2025-09-04
2025-11-14 16:51:08,704 - INFO - Finished converting document 4_2025-09-04 in 0.36 sec.
2025-11-14 16:51:08,777 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:51:08,778 - ERROR - Input document 4_2025-09-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:51:08,780 - INFO - Going to convert document batch...
2025-11-14 16:51:08,793 - IN

Converted 'data\edgar_documents\INTC\4_2025-09-04' --> 'data\processed_data\INTC\4_2025-09-04.md'
Error processing data\edgar_documents\INTC\4_2025-09-05: File format not allowed: data\edgar_documents\INTC\4_2025-09-05
Converted 'data\edgar_documents\INTC\8-K_2023-01-26' --> 'data\processed_data\INTC\8-K_2023-01-26.md'


2025-11-14 16:51:08,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:08,955 - INFO - Going to convert document batch...
2025-11-14 16:51:08,957 - INFO - Processing document 8-K_2023-04-27
2025-11-14 16:51:08,986 - INFO - Finished converting document 8-K_2023-04-27 in 0.06 sec.


Converted 'data\edgar_documents\INTC\8-K_2023-02-10' --> 'data\processed_data\INTC\8-K_2023-02-10.md'
Converted 'data\edgar_documents\INTC\8-K_2023-04-27' --> 'data\processed_data\INTC\8-K_2023-04-27.md'


2025-11-14 16:51:09,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,143 - INFO - Going to convert document batch...
2025-11-14 16:51:09,144 - INFO - Processing document 8-K_2023-05-17
2025-11-14 16:51:09,200 - INFO - Finished converting document 8-K_2023-05-17 in 0.16 sec.
2025-11-14 16:51:09,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,284 - INFO - Going to convert document batch...
2025-11-14 16:51:09,284 - INFO - Processing document 8-K_2023-07-27
2025-11-14 16:51:09,303 - INFO - Finished converting document 8-K_2023-07-27 in 0.08 sec.
2025-11-14 16:51:09,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,340 - INFO - Going to convert document batch...
2025-11-14 16:51:09,341 - INFO - Processing document 8-K_2023-08-16
2025-11-14 16:51:09,360 - INFO - Finished converting document 8-K_2023-08-16 in 0.05 sec.
2025-11-14 16:51:09,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\INTC\8-K_2023-05-17' --> 'data\processed_data\INTC\8-K_2023-05-17.md'
Converted 'data\edgar_documents\INTC\8-K_2023-07-27' --> 'data\processed_data\INTC\8-K_2023-07-27.md'
Converted 'data\edgar_documents\INTC\8-K_2023-08-16' --> 'data\processed_data\INTC\8-K_2023-08-16.md'


2025-11-14 16:51:09,408 - INFO - Processing document 8-K_2023-10-05
2025-11-14 16:51:09,428 - INFO - Finished converting document 8-K_2023-10-05 in 0.05 sec.
2025-11-14 16:51:09,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,509 - INFO - Going to convert document batch...
2025-11-14 16:51:09,510 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:51:09,526 - INFO - Finished converting document 8-K_2023-10-26 in 0.06 sec.
2025-11-14 16:51:09,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,563 - INFO - Going to convert document batch...
2025-11-14 16:51:09,564 - INFO - Processing document 8-K_2023-10-30
2025-11-14 16:51:09,578 - INFO - Finished converting document 8-K_2023-10-30 in 0.05 sec.
2025-11-14 16:51:09,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,614 - INFO - Going to convert document batch...
2025-11-14 16:51:09,616 - INFO - Processing document 8-K_2023-12-05
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2023-10-05' --> 'data\processed_data\INTC\8-K_2023-10-05.md'
Converted 'data\edgar_documents\INTC\8-K_2023-10-26' --> 'data\processed_data\INTC\8-K_2023-10-26.md'
Converted 'data\edgar_documents\INTC\8-K_2023-10-30' --> 'data\processed_data\INTC\8-K_2023-10-30.md'
Converted 'data\edgar_documents\INTC\8-K_2023-12-05' --> 'data\processed_data\INTC\8-K_2023-12-05.md'


2025-11-14 16:51:09,677 - INFO - Going to convert document batch...
2025-11-14 16:51:09,680 - INFO - Processing document 8-K_2024-01-03
2025-11-14 16:51:09,701 - INFO - Finished converting document 8-K_2024-01-03 in 0.06 sec.
2025-11-14 16:51:09,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,752 - INFO - Going to convert document batch...
2025-11-14 16:51:09,752 - INFO - Processing document 8-K_2024-01-25
2025-11-14 16:51:09,770 - INFO - Finished converting document 8-K_2024-01-25 in 0.05 sec.
2025-11-14 16:51:09,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,805 - INFO - Going to convert document batch...
2025-11-14 16:51:09,806 - INFO - Processing document 8-K_2024-02-16
2025-11-14 16:51:09,820 - INFO - Finished converting document 8-K_2024-02-16 in 0.03 sec.
2025-11-14 16:51:09,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,876 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2024-01-03' --> 'data\processed_data\INTC\8-K_2024-01-03.md'
Converted 'data\edgar_documents\INTC\8-K_2024-01-25' --> 'data\processed_data\INTC\8-K_2024-01-25.md'
Converted 'data\edgar_documents\INTC\8-K_2024-02-16' --> 'data\processed_data\INTC\8-K_2024-02-16.md'


2025-11-14 16:51:09,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:09,938 - INFO - Going to convert document batch...
2025-11-14 16:51:09,940 - INFO - Processing document 8-K_2024-03-13
2025-11-14 16:51:09,974 - INFO - Finished converting document 8-K_2024-03-13 in 0.06 sec.
2025-11-14 16:51:10,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,009 - INFO - Going to convert document batch...
2025-11-14 16:51:10,010 - INFO - Processing document 8-K_2024-04-02
2025-11-14 16:51:10,027 - INFO - Finished converting document 8-K_2024-04-02 in 0.05 sec.
2025-11-14 16:51:10,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,061 - INFO - Going to convert document batch...
2025-11-14 16:51:10,063 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:51:10,080 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 16:51:10,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\8-K_2024-02-21' --> 'data\processed_data\INTC\8-K_2024-02-21.md'
Converted 'data\edgar_documents\INTC\8-K_2024-03-13' --> 'data\processed_data\INTC\8-K_2024-03-13.md'
Converted 'data\edgar_documents\INTC\8-K_2024-04-02' --> 'data\processed_data\INTC\8-K_2024-04-02.md'
Converted 'data\edgar_documents\INTC\8-K_2024-04-25' --> 'data\processed_data\INTC\8-K_2024-04-25.md'


2025-11-14 16:51:10,119 - INFO - Going to convert document batch...
2025-11-14 16:51:10,120 - INFO - Processing document 8-K_2024-05-08
2025-11-14 16:51:10,153 - INFO - Finished converting document 8-K_2024-05-08 in 0.06 sec.
2025-11-14 16:51:10,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,200 - INFO - Going to convert document batch...
2025-11-14 16:51:10,202 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:51:10,241 - INFO - Finished converting document 8-K_2024-05-09 in 0.08 sec.
2025-11-14 16:51:10,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,298 - INFO - Going to convert document batch...
2025-11-14 16:51:10,299 - INFO - Processing document 8-K_2024-06-04
2025-11-14 16:51:10,321 - INFO - Finished converting document 8-K_2024-06-04 in 0.05 sec.
2025-11-14 16:51:10,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\8-K_2024-05-08' --> 'data\processed_data\INTC\8-K_2024-05-08.md'
Converted 'data\edgar_documents\INTC\8-K_2024-05-09' --> 'data\processed_data\INTC\8-K_2024-05-09.md'
Converted 'data\edgar_documents\INTC\8-K_2024-06-04' --> 'data\processed_data\INTC\8-K_2024-06-04.md'


2025-11-14 16:51:10,372 - INFO - Going to convert document batch...
2025-11-14 16:51:10,373 - INFO - Processing document 8-K_2024-06-14
2025-11-14 16:51:10,392 - INFO - Finished converting document 8-K_2024-06-14 in 0.06 sec.
2025-11-14 16:51:10,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,434 - INFO - Going to convert document batch...
2025-11-14 16:51:10,434 - INFO - Processing document 8-K_2024-08-01
2025-11-14 16:51:10,455 - INFO - Finished converting document 8-K_2024-08-01 in 0.05 sec.
2025-11-14 16:51:10,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,488 - INFO - Going to convert document batch...
2025-11-14 16:51:10,489 - INFO - Processing document 8-K_2024-08-22
2025-11-14 16:51:10,505 - INFO - Finished converting document 8-K_2024-08-22 in 0.03 sec.
2025-11-14 16:51:10,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,538 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2024-06-14' --> 'data\processed_data\INTC\8-K_2024-06-14.md'
Converted 'data\edgar_documents\INTC\8-K_2024-08-01' --> 'data\processed_data\INTC\8-K_2024-08-01.md'
Converted 'data\edgar_documents\INTC\8-K_2024-08-22' --> 'data\processed_data\INTC\8-K_2024-08-22.md'
Converted 'data\edgar_documents\INTC\8-K_2024-10-31' --> 'data\processed_data\INTC\8-K_2024-10-31.md'


2025-11-14 16:51:10,593 - INFO - Processing document 8-K_2024-11-27
2025-11-14 16:51:10,615 - INFO - Finished converting document 8-K_2024-11-27 in 0.05 sec.
2025-11-14 16:51:10,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,663 - INFO - Going to convert document batch...
2025-11-14 16:51:10,664 - INFO - Processing document 8-K_2024-12-03
2025-11-14 16:51:10,690 - INFO - Finished converting document 8-K_2024-12-03 in 0.06 sec.
2025-11-14 16:51:10,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,734 - INFO - Going to convert document batch...
2025-11-14 16:51:10,735 - INFO - Processing document 8-K_2024-12-05
2025-11-14 16:51:10,755 - INFO - Finished converting document 8-K_2024-12-05 in 0.05 sec.
2025-11-14 16:51:10,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,787 - INFO - Going to convert document batch...
2025-11-14 16:51:10,788 - INFO - Processing document 8-K_2025-01-30
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2024-11-27' --> 'data\processed_data\INTC\8-K_2024-11-27.md'
Converted 'data\edgar_documents\INTC\8-K_2024-12-03' --> 'data\processed_data\INTC\8-K_2024-12-03.md'
Converted 'data\edgar_documents\INTC\8-K_2024-12-05' --> 'data\processed_data\INTC\8-K_2024-12-05.md'


2025-11-14 16:51:10,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,839 - INFO - Going to convert document batch...
2025-11-14 16:51:10,840 - INFO - Processing document 8-K_2025-02-28
2025-11-14 16:51:10,865 - INFO - Finished converting document 8-K_2025-02-28 in 0.05 sec.
2025-11-14 16:51:10,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,910 - INFO - Going to convert document batch...
2025-11-14 16:51:10,911 - INFO - Processing document 8-K_2025-03-14
2025-11-14 16:51:10,926 - INFO - Finished converting document 8-K_2025-03-14 in 0.05 sec.
2025-11-14 16:51:10,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:10,971 - INFO - Going to convert document batch...
2025-11-14 16:51:10,972 - INFO - Processing document 8-K_2025-03-28
2025-11-14 16:51:10,988 - INFO - Finished converting document 8-K_2025-03-28 in 0.05 sec.


Converted 'data\edgar_documents\INTC\8-K_2025-01-30' --> 'data\processed_data\INTC\8-K_2025-01-30.md'
Converted 'data\edgar_documents\INTC\8-K_2025-02-28' --> 'data\processed_data\INTC\8-K_2025-02-28.md'
Converted 'data\edgar_documents\INTC\8-K_2025-03-14' --> 'data\processed_data\INTC\8-K_2025-03-14.md'


2025-11-14 16:51:11,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,032 - INFO - Going to convert document batch...
2025-11-14 16:51:11,034 - INFO - Processing document 8-K_2025-04-14
2025-11-14 16:51:11,057 - INFO - Finished converting document 8-K_2025-04-14 in 0.05 sec.
2025-11-14 16:51:11,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,106 - INFO - Going to convert document batch...
2025-11-14 16:51:11,108 - INFO - Processing document 8-K_2025-04-17
2025-11-14 16:51:11,135 - INFO - Finished converting document 8-K_2025-04-17 in 0.05 sec.
2025-11-14 16:51:11,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,171 - INFO - Going to convert document batch...
2025-11-14 16:51:11,172 - INFO - Processing document 8-K_2025-04-24


Converted 'data\edgar_documents\INTC\8-K_2025-03-28' --> 'data\processed_data\INTC\8-K_2025-03-28.md'
Converted 'data\edgar_documents\INTC\8-K_2025-04-14' --> 'data\processed_data\INTC\8-K_2025-04-14.md'
Converted 'data\edgar_documents\INTC\8-K_2025-04-17' --> 'data\processed_data\INTC\8-K_2025-04-17.md'


2025-11-14 16:51:11,191 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 16:51:11,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,324 - INFO - Going to convert document batch...
2025-11-14 16:51:11,325 - INFO - Processing document 8-K_2025-04-30
2025-11-14 16:51:11,354 - INFO - Finished converting document 8-K_2025-04-30 in 0.16 sec.


Converted 'data\edgar_documents\INTC\8-K_2025-04-24' --> 'data\processed_data\INTC\8-K_2025-04-24.md'
Converted 'data\edgar_documents\INTC\8-K_2025-04-30' --> 'data\processed_data\INTC\8-K_2025-04-30.md'


2025-11-14 16:51:11,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,447 - INFO - Going to convert document batch...
2025-11-14 16:51:11,448 - INFO - Processing document 8-K_2025-05-09
2025-11-14 16:51:11,493 - INFO - Finished converting document 8-K_2025-05-09 in 0.12 sec.
2025-11-14 16:51:11,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,538 - INFO - Going to convert document batch...
2025-11-14 16:51:11,538 - INFO - Processing document 8-K_2025-07-24
2025-11-14 16:51:11,554 - INFO - Finished converting document 8-K_2025-07-24 in 0.03 sec.
2025-11-14 16:51:11,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,586 - INFO - Going to convert document batch...
2025-11-14 16:51:11,587 - INFO - Processing document 8-K_2025-08-14
2025-11-14 16:51:11,604 - INFO - Finished converting document 8-K_2025-08-14 in 0.05 sec.
2025-11-14 16:51:11,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\INTC\8-K_2025-05-09' --> 'data\processed_data\INTC\8-K_2025-05-09.md'
Converted 'data\edgar_documents\INTC\8-K_2025-07-24' --> 'data\processed_data\INTC\8-K_2025-07-24.md'
Converted 'data\edgar_documents\INTC\8-K_2025-08-14' --> 'data\processed_data\INTC\8-K_2025-08-14.md'
Converted 'data\edgar_documents\INTC\8-K_2025-08-21' --> 'data\processed_data\INTC\8-K_2025-08-21.md'


2025-11-14 16:51:11,700 - INFO - Processing document 8-K_2025-08-25
2025-11-14 16:51:11,726 - INFO - Finished converting document 8-K_2025-08-25 in 0.06 sec.
2025-11-14 16:51:11,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,769 - INFO - Going to convert document batch...
2025-11-14 16:51:11,770 - INFO - Processing document 8-K_2025-08-29
2025-11-14 16:51:11,785 - INFO - Finished converting document 8-K_2025-08-29 in 0.05 sec.
2025-11-14 16:51:11,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,819 - INFO - Going to convert document batch...
2025-11-14 16:51:11,819 - INFO - Processing document 8-K_2025-09-05
2025-11-14 16:51:11,837 - INFO - Finished converting document 8-K_2025-09-05 in 0.03 sec.
2025-11-14 16:51:11,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:11,869 - INFO - Going to convert document batch...
2025-11-14 16:51:11,870 - INFO - Processing document 8-K_2025-09-08
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2025-08-25' --> 'data\processed_data\INTC\8-K_2025-08-25.md'
Converted 'data\edgar_documents\INTC\8-K_2025-08-29' --> 'data\processed_data\INTC\8-K_2025-08-29.md'
Converted 'data\edgar_documents\INTC\8-K_2025-09-05' --> 'data\processed_data\INTC\8-K_2025-09-05.md'
Converted 'data\edgar_documents\INTC\8-K_2025-09-08' --> 'data\processed_data\INTC\8-K_2025-09-08.md'


2025-11-14 16:51:11,925 - INFO - Processing document 8-K_2025-09-15
2025-11-14 16:51:11,966 - INFO - Finished converting document 8-K_2025-09-15 in 0.08 sec.
2025-11-14 16:51:12,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:12,023 - INFO - Going to convert document batch...
2025-11-14 16:51:12,025 - INFO - Processing document 8-K_2025-09-18
2025-11-14 16:51:12,051 - INFO - Finished converting document 8-K_2025-09-18 in 0.05 sec.
2025-11-14 16:51:12,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:12,090 - INFO - Going to convert document batch...
2025-11-14 16:51:12,090 - INFO - Processing document 8-K_2025-09-29
2025-11-14 16:51:12,103 - INFO - Finished converting document 8-K_2025-09-29 in 0.03 sec.
2025-11-14 16:51:12,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:12,133 - INFO - Going to convert document batch...
2025-11-14 16:51:12,134 - INFO - Processing document 8-K_2025-10-23
2025-11-14 16:

Converted 'data\edgar_documents\INTC\8-K_2025-09-15' --> 'data\processed_data\INTC\8-K_2025-09-15.md'
Converted 'data\edgar_documents\INTC\8-K_2025-09-18' --> 'data\processed_data\INTC\8-K_2025-09-18.md'
Converted 'data\edgar_documents\INTC\8-K_2025-09-29' --> 'data\processed_data\INTC\8-K_2025-09-29.md'
Converted 'data\edgar_documents\INTC\8-K_2025-10-23' --> 'data\processed_data\INTC\8-K_2025-10-23.md'


2025-11-14 16:51:12,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:51:13,441 - INFO - Going to convert document batch...
2025-11-14 16:51:13,442 - INFO - Processing document DEF-14A_2023-03-31
2025-11-14 16:51:20,357 - INFO - Finished converting document DEF-14A_2023-03-31 in 8.20 sec.
2025-11-14 16:51:22,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\DEF-14A_2023-03-31' --> 'data\processed_data\INTC\DEF-14A_2023-03-31.md'


2025-11-14 16:51:23,301 - INFO - Going to convert document batch...
2025-11-14 16:51:23,302 - INFO - Processing document DEF-14A_2024-03-28
2025-11-14 16:51:28,610 - INFO - Finished converting document DEF-14A_2024-03-28 in 6.05 sec.
2025-11-14 16:51:30,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\DEF-14A_2024-03-28' --> 'data\processed_data\INTC\DEF-14A_2024-03-28.md'


2025-11-14 16:51:31,232 - INFO - Going to convert document batch...
2025-11-14 16:51:31,233 - INFO - Processing document DEF-14A_2025-03-27
2025-11-14 16:51:35,108 - INFO - Finished converting document DEF-14A_2025-03-27 in 4.64 sec.
2025-11-14 16:51:36,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTC\DEF-14A_2025-03-27' --> 'data\processed_data\INTC\DEF-14A_2025-03-27.md'
Processed 128 new files. Errors: 5
Found 150 files to process in data\edgar_documents\INTU


2025-11-14 16:51:37,947 - INFO - Going to convert document batch...
2025-11-14 16:51:37,949 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:51:37,950 - INFO - Processing document 10-K_2023-09-01
2025-11-14 16:51:40,853 - INFO - Finished converting document 10-K_2023-09-01 in 4.19 sec.
2025-11-14 16:51:41,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-K_2023-09-01' --> 'data\processed_data\INTU\10-K_2023-09-01.md'


2025-11-14 16:51:42,871 - INFO - Going to convert document batch...
2025-11-14 16:51:42,873 - INFO - Processing document 10-K_2024-09-04
2025-11-14 16:51:45,763 - INFO - Finished converting document 10-K_2024-09-04 in 4.12 sec.
2025-11-14 16:51:46,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-K_2024-09-04' --> 'data\processed_data\INTU\10-K_2024-09-04.md'


2025-11-14 16:51:47,953 - INFO - Going to convert document batch...
2025-11-14 16:51:47,954 - INFO - Processing document 10-K_2025-09-03
2025-11-14 16:51:50,775 - INFO - Finished converting document 10-K_2025-09-03 in 4.16 sec.
2025-11-14 16:51:51,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-K_2025-09-03' --> 'data\processed_data\INTU\10-K_2025-09-03.md'


2025-11-14 16:51:52,768 - INFO - Going to convert document batch...
2025-11-14 16:51:52,769 - INFO - Processing document 10-Q_2023-02-23
2025-11-14 16:51:54,154 - INFO - Finished converting document 10-Q_2023-02-23 in 2.50 sec.
2025-11-14 16:51:54,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2023-02-23' --> 'data\processed_data\INTU\10-Q_2023-02-23.md'


2025-11-14 16:51:55,203 - INFO - Going to convert document batch...
2025-11-14 16:51:55,204 - INFO - Processing document 10-Q_2023-05-23
2025-11-14 16:51:57,184 - INFO - Finished converting document 10-Q_2023-05-23 in 2.52 sec.
2025-11-14 16:51:57,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2023-05-23' --> 'data\processed_data\INTU\10-Q_2023-05-23.md'


2025-11-14 16:51:58,173 - INFO - Going to convert document batch...
2025-11-14 16:51:58,174 - INFO - Processing document 10-Q_2023-11-28
2025-11-14 16:51:59,251 - INFO - Finished converting document 10-Q_2023-11-28 in 1.56 sec.
2025-11-14 16:52:00,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2023-11-28' --> 'data\processed_data\INTU\10-Q_2023-11-28.md'


2025-11-14 16:52:00,937 - INFO - Going to convert document batch...
2025-11-14 16:52:00,938 - INFO - Processing document 10-Q_2024-02-22
2025-11-14 16:52:02,576 - INFO - Finished converting document 10-Q_2024-02-22 in 2.64 sec.
2025-11-14 16:52:03,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2024-02-22' --> 'data\processed_data\INTU\10-Q_2024-02-22.md'


2025-11-14 16:52:03,722 - INFO - Going to convert document batch...
2025-11-14 16:52:03,722 - INFO - Processing document 10-Q_2024-05-23
2025-11-14 16:52:05,745 - INFO - Finished converting document 10-Q_2024-05-23 in 2.66 sec.
2025-11-14 16:52:06,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2024-05-23' --> 'data\processed_data\INTU\10-Q_2024-05-23.md'


2025-11-14 16:52:06,913 - INFO - Going to convert document batch...
2025-11-14 16:52:06,914 - INFO - Processing document 10-Q_2024-11-21
2025-11-14 16:52:08,202 - INFO - Finished converting document 10-Q_2024-11-21 in 1.97 sec.
2025-11-14 16:52:08,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2024-11-21' --> 'data\processed_data\INTU\10-Q_2024-11-21.md'


2025-11-14 16:52:09,892 - INFO - Going to convert document batch...
2025-11-14 16:52:09,893 - INFO - Processing document 10-Q_2025-02-25
2025-11-14 16:52:11,515 - INFO - Finished converting document 10-Q_2025-02-25 in 2.72 sec.
2025-11-14 16:52:12,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\10-Q_2025-02-25' --> 'data\processed_data\INTU\10-Q_2025-02-25.md'


2025-11-14 16:52:12,784 - INFO - Going to convert document batch...
2025-11-14 16:52:12,784 - INFO - Processing document 10-Q_2025-05-22
2025-11-14 16:52:14,594 - INFO - Finished converting document 10-Q_2025-05-22 in 2.38 sec.
2025-11-14 16:52:15,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,252 - INFO - Going to convert document batch...
2025-11-14 16:52:15,253 - INFO - Processing document 4_2023-01-04
2025-11-14 16:52:15,305 - INFO - Finished converting document 4_2023-01-04 in 0.11 sec.


Converted 'data\edgar_documents\INTU\10-Q_2025-05-22' --> 'data\processed_data\INTU\10-Q_2025-05-22.md'
Converted 'data\edgar_documents\INTU\4_2023-01-04' --> 'data\processed_data\INTU\4_2023-01-04.md'


2025-11-14 16:52:15,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,429 - INFO - Going to convert document batch...
2025-11-14 16:52:15,431 - INFO - Processing document 4_2023-01-10
2025-11-14 16:52:15,459 - INFO - Finished converting document 4_2023-01-10 in 0.09 sec.
2025-11-14 16:52:15,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,536 - INFO - Going to convert document batch...
2025-11-14 16:52:15,537 - INFO - Processing document 4_2023-01-20
2025-11-14 16:52:15,592 - INFO - Finished converting document 4_2023-01-20 in 0.11 sec.
2025-11-14 16:52:15,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,667 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2023-01-10' --> 'data\processed_data\INTU\4_2023-01-10.md'
Converted 'data\edgar_documents\INTU\4_2023-01-20' --> 'data\processed_data\INTU\4_2023-01-20.md'


2025-11-14 16:52:15,668 - INFO - Processing document 4_2023-01-23
2025-11-14 16:52:15,692 - INFO - Finished converting document 4_2023-01-23 in 0.05 sec.
2025-11-14 16:52:15,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,753 - INFO - Going to convert document batch...
2025-11-14 16:52:15,754 - INFO - Processing document 4_2023-01-24
2025-11-14 16:52:15,778 - INFO - Finished converting document 4_2023-01-24 in 0.06 sec.
2025-11-14 16:52:15,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,859 - INFO - Going to convert document batch...
2025-11-14 16:52:15,860 - INFO - Processing document 4_2023-02-03
2025-11-14 16:52:15,899 - INFO - Finished converting document 4_2023-02-03 in 0.09 sec.


Converted 'data\edgar_documents\INTU\4_2023-01-23' --> 'data\processed_data\INTU\4_2023-01-23.md'
Converted 'data\edgar_documents\INTU\4_2023-01-24' --> 'data\processed_data\INTU\4_2023-01-24.md'


2025-11-14 16:52:15,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:15,974 - INFO - Going to convert document batch...
2025-11-14 16:52:15,976 - INFO - Processing document 4_2023-02-28
2025-11-14 16:52:16,008 - INFO - Finished converting document 4_2023-02-28 in 0.08 sec.


Converted 'data\edgar_documents\INTU\4_2023-02-03' --> 'data\processed_data\INTU\4_2023-02-03.md'
Converted 'data\edgar_documents\INTU\4_2023-02-28' --> 'data\processed_data\INTU\4_2023-02-28.md'


2025-11-14 16:52:16,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,165 - INFO - Going to convert document batch...
2025-11-14 16:52:16,166 - INFO - Processing document 4_2023-03-02
2025-11-14 16:52:16,190 - INFO - Finished converting document 4_2023-03-02 in 0.08 sec.
2025-11-14 16:52:16,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,257 - INFO - Going to convert document batch...
2025-11-14 16:52:16,257 - INFO - Processing document 4_2023-03-06
2025-11-14 16:52:16,280 - INFO - Finished converting document 4_2023-03-06 in 0.06 sec.
2025-11-14 16:52:16,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,332 - INFO - Going to convert document batch...
2025-11-14 16:52:16,333 - INFO - Processing document 4_2023-03-08
2025-11-14 16:52:16,355 - INFO - Finished converting document 4_2023-03-08 in 0.05 sec.
2025-11-14 16:52:16,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2023-03-02' --> 'data\processed_data\INTU\4_2023-03-02.md'
Converted 'data\edgar_documents\INTU\4_2023-03-06' --> 'data\processed_data\INTU\4_2023-03-06.md'
Converted 'data\edgar_documents\INTU\4_2023-03-08' --> 'data\processed_data\INTU\4_2023-03-08.md'


2025-11-14 16:52:16,432 - INFO - Going to convert document batch...
2025-11-14 16:52:16,433 - INFO - Processing document 4_2023-04-04
2025-11-14 16:52:16,477 - INFO - Finished converting document 4_2023-04-04 in 0.09 sec.
2025-11-14 16:52:16,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,679 - INFO - Going to convert document batch...
2025-11-14 16:52:16,680 - INFO - Processing document 4_2023-05-08
2025-11-14 16:52:16,722 - INFO - Finished converting document 4_2023-05-08 in 0.11 sec.
2025-11-14 16:52:16,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,798 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2023-04-04' --> 'data\processed_data\INTU\4_2023-04-04.md'
Converted 'data\edgar_documents\INTU\4_2023-05-08' --> 'data\processed_data\INTU\4_2023-05-08.md'


2025-11-14 16:52:16,801 - INFO - Processing document 4_2023-05-09
2025-11-14 16:52:16,846 - INFO - Finished converting document 4_2023-05-09 in 0.09 sec.
2025-11-14 16:52:16,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:16,949 - INFO - Going to convert document batch...
2025-11-14 16:52:16,949 - INFO - Processing document 4_2023-05-30
2025-11-14 16:52:16,969 - INFO - Finished converting document 4_2023-05-30 in 0.08 sec.
2025-11-14 16:52:17,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,029 - INFO - Going to convert document batch...
2025-11-14 16:52:17,030 - INFO - Processing document 4_2023-06-05
2025-11-14 16:52:17,070 - INFO - Finished converting document 4_2023-06-05 in 0.06 sec.


Converted 'data\edgar_documents\INTU\4_2023-05-09' --> 'data\processed_data\INTU\4_2023-05-09.md'
Converted 'data\edgar_documents\INTU\4_2023-05-30' --> 'data\processed_data\INTU\4_2023-05-30.md'


2025-11-14 16:52:17,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,173 - INFO - Going to convert document batch...
2025-11-14 16:52:17,175 - INFO - Processing document 4_2023-07-03
2025-11-14 16:52:17,226 - INFO - Finished converting document 4_2023-07-03 in 0.09 sec.


Converted 'data\edgar_documents\INTU\4_2023-06-05' --> 'data\processed_data\INTU\4_2023-06-05.md'


2025-11-14 16:52:17,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,392 - INFO - Going to convert document batch...
2025-11-14 16:52:17,393 - INFO - Processing document 4_2023-07-05
2025-11-14 16:52:17,444 - INFO - Finished converting document 4_2023-07-05 in 0.09 sec.
2025-11-14 16:52:17,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,518 - INFO - Going to convert document batch...
2025-11-14 16:52:17,519 - INFO - Processing document 4_2023-07-31


Converted 'data\edgar_documents\INTU\4_2023-07-03' --> 'data\processed_data\INTU\4_2023-07-03.md'
Converted 'data\edgar_documents\INTU\4_2023-07-05' --> 'data\processed_data\INTU\4_2023-07-05.md'


2025-11-14 16:52:17,552 - INFO - Finished converting document 4_2023-07-31 in 0.08 sec.
2025-11-14 16:52:17,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,646 - INFO - Going to convert document batch...
2025-11-14 16:52:17,649 - INFO - Processing document 4_2023-08-02
2025-11-14 16:52:17,671 - INFO - Finished converting document 4_2023-08-02 in 0.08 sec.
2025-11-14 16:52:17,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,733 - INFO - Going to convert document batch...
2025-11-14 16:52:17,734 - INFO - Processing document 4_2023-08-15
2025-11-14 16:52:17,767 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.


Converted 'data\edgar_documents\INTU\4_2023-07-31' --> 'data\processed_data\INTU\4_2023-07-31.md'
Converted 'data\edgar_documents\INTU\4_2023-08-02' --> 'data\processed_data\INTU\4_2023-08-02.md'
Converted 'data\edgar_documents\INTU\4_2023-08-15' --> 'data\processed_data\INTU\4_2023-08-15.md'


2025-11-14 16:52:17,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:17,846 - INFO - Going to convert document batch...
2025-11-14 16:52:17,847 - INFO - Processing document 4_2023-08-30
2025-11-14 16:52:17,879 - INFO - Finished converting document 4_2023-08-30 in 0.08 sec.
2025-11-14 16:52:18,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,032 - INFO - Going to convert document batch...
2025-11-14 16:52:18,040 - INFO - Processing document 4_2023-09-06
2025-11-14 16:52:18,070 - INFO - Finished converting document 4_2023-09-06 in 0.16 sec.


Converted 'data\edgar_documents\INTU\4_2023-08-30' --> 'data\processed_data\INTU\4_2023-08-30.md'


2025-11-14 16:52:18,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,142 - INFO - Going to convert document batch...
2025-11-14 16:52:18,143 - INFO - Processing document 4_2023-09-07
2025-11-14 16:52:18,183 - INFO - Finished converting document 4_2023-09-07 in 0.09 sec.
2025-11-14 16:52:18,247 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:52:18,248 - ERROR - Input document 4_2023-09-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:52

Converted 'data\edgar_documents\INTU\4_2023-09-06' --> 'data\processed_data\INTU\4_2023-09-06.md'
Converted 'data\edgar_documents\INTU\4_2023-09-07' --> 'data\processed_data\INTU\4_2023-09-07.md'
Error processing data\edgar_documents\INTU\4_2023-09-12: File format not allowed: data\edgar_documents\INTU\4_2023-09-12


2025-11-14 16:52:18,358 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:52:18,359 - ERROR - Input document 4_2023-09-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:52:18,361 - INFO - Going to convert document batch...
2025-11-14 16:52:18,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,399 - INFO - Going to convert document batch...
2025-11-14 16:52:18,435 - INFO - Processing document 4_2023-10-03
2025-11-14 16:52:18,506 - INFO - Fin

Converted 'data\edgar_documents\INTU\4_2023-09-13' --> 'data\processed_data\INTU\4_2023-09-13.md'
Error processing data\edgar_documents\INTU\4_2023-09-14: File format not allowed: data\edgar_documents\INTU\4_2023-09-14


2025-11-14 16:52:18,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,585 - INFO - Going to convert document batch...
2025-11-14 16:52:18,586 - INFO - Processing document 4_2023-10-04
2025-11-14 16:52:18,615 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 16:52:18,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,687 - INFO - Going to convert document batch...
2025-11-14 16:52:18,688 - INFO - Processing document 4_2023-10-06
2025-11-14 16:52:18,707 - INFO - Finished converting document 4_2023-10-06 in 0.06 sec.
2025-11-14 16:52:18,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,748 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2023-10-03' --> 'data\processed_data\INTU\4_2023-10-03.md'
Converted 'data\edgar_documents\INTU\4_2023-10-04' --> 'data\processed_data\INTU\4_2023-10-04.md'
Converted 'data\edgar_documents\INTU\4_2023-10-06' --> 'data\processed_data\INTU\4_2023-10-06.md'


2025-11-14 16:52:18,749 - INFO - Processing document 4_2023-10-31
2025-11-14 16:52:18,781 - INFO - Finished converting document 4_2023-10-31 in 0.06 sec.
2025-11-14 16:52:18,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,845 - INFO - Going to convert document batch...
2025-11-14 16:52:18,846 - INFO - Processing document 4_2023-11-01
2025-11-14 16:52:18,871 - INFO - Finished converting document 4_2023-11-01 in 0.06 sec.
2025-11-14 16:52:18,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:18,934 - INFO - Going to convert document batch...
2025-11-14 16:52:18,934 - INFO - Processing document 4_2023-12-05
2025-11-14 16:52:18,958 - INFO - Finished converting document 4_2023-12-05 in 0.06 sec.
2025-11-14 16:52:19,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2023-10-31' --> 'data\processed_data\INTU\4_2023-10-31.md'
Converted 'data\edgar_documents\INTU\4_2023-11-01' --> 'data\processed_data\INTU\4_2023-11-01.md'
Converted 'data\edgar_documents\INTU\4_2023-12-05' --> 'data\processed_data\INTU\4_2023-12-05.md'


2025-11-14 16:52:19,025 - INFO - Going to convert document batch...
2025-11-14 16:52:19,026 - INFO - Processing document 4_2023-12-08
2025-11-14 16:52:19,089 - INFO - Finished converting document 4_2023-12-08 in 0.11 sec.
2025-11-14 16:52:19,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,181 - INFO - Going to convert document batch...
2025-11-14 16:52:19,182 - INFO - Processing document 4_2023-12-12
2025-11-14 16:52:19,222 - INFO - Finished converting document 4_2023-12-12 in 0.08 sec.
2025-11-14 16:52:19,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,317 - INFO - Going to convert document batch...
2025-11-14 16:52:19,318 - INFO - Processing document 4_2023-12-20


Converted 'data\edgar_documents\INTU\4_2023-12-08' --> 'data\processed_data\INTU\4_2023-12-08.md'
Converted 'data\edgar_documents\INTU\4_2023-12-12' --> 'data\processed_data\INTU\4_2023-12-12.md'


2025-11-14 16:52:19,349 - INFO - Finished converting document 4_2023-12-20 in 0.08 sec.
2025-11-14 16:52:19,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,412 - INFO - Going to convert document batch...
2025-11-14 16:52:19,413 - INFO - Processing document 4_2023-12-22
2025-11-14 16:52:19,442 - INFO - Finished converting document 4_2023-12-22 in 0.06 sec.
2025-11-14 16:52:19,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,503 - INFO - Going to convert document batch...
2025-11-14 16:52:19,503 - INFO - Processing document 4_2024-01-02
2025-11-14 16:52:19,547 - INFO - Finished converting document 4_2024-01-02 in 0.09 sec.


Converted 'data\edgar_documents\INTU\4_2023-12-20' --> 'data\processed_data\INTU\4_2023-12-20.md'
Converted 'data\edgar_documents\INTU\4_2023-12-22' --> 'data\processed_data\INTU\4_2023-12-22.md'


2025-11-14 16:52:19,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,629 - INFO - Going to convert document batch...
2025-11-14 16:52:19,630 - INFO - Processing document 4_2024-01-04
2025-11-14 16:52:19,664 - INFO - Finished converting document 4_2024-01-04 in 0.08 sec.
2025-11-14 16:52:19,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,745 - INFO - Going to convert document batch...
2025-11-14 16:52:19,745 - INFO - Processing document 4_2024-01-09


Converted 'data\edgar_documents\INTU\4_2024-01-02' --> 'data\processed_data\INTU\4_2024-01-02.md'
Converted 'data\edgar_documents\INTU\4_2024-01-04' --> 'data\processed_data\INTU\4_2024-01-04.md'


2025-11-14 16:52:19,798 - INFO - Finished converting document 4_2024-01-09 in 0.11 sec.
2025-11-14 16:52:19,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,896 - INFO - Going to convert document batch...
2025-11-14 16:52:19,896 - INFO - Processing document 4_2024-01-10
2025-11-14 16:52:19,915 - INFO - Finished converting document 4_2024-01-10 in 0.05 sec.
2025-11-14 16:52:19,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:19,972 - INFO - Going to convert document batch...
2025-11-14 16:52:19,973 - INFO - Processing document 4_2024-01-22
2025-11-14 16:52:20,004 - INFO - Finished converting document 4_2024-01-22 in 0.06 sec.
2025-11-14 16:52:20,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-01-09' --> 'data\processed_data\INTU\4_2024-01-09.md'
Converted 'data\edgar_documents\INTU\4_2024-01-10' --> 'data\processed_data\INTU\4_2024-01-10.md'
Converted 'data\edgar_documents\INTU\4_2024-01-22' --> 'data\processed_data\INTU\4_2024-01-22.md'


2025-11-14 16:52:20,088 - INFO - Going to convert document batch...
2025-11-14 16:52:20,089 - INFO - Processing document 4_2024-02-27
2025-11-14 16:52:20,131 - INFO - Finished converting document 4_2024-02-27 in 0.09 sec.
2025-11-14 16:52:20,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:20,203 - INFO - Going to convert document batch...
2025-11-14 16:52:20,203 - INFO - Processing document 4_2024-03-04
2025-11-14 16:52:20,228 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.
2025-11-14 16:52:20,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:20,309 - INFO - Going to convert document batch...
2025-11-14 16:52:20,309 - INFO - Processing document 4_2024-03-21
2025-11-14 16:52:20,336 - INFO - Finished converting document 4_2024-03-21 in 0.08 sec.


Converted 'data\edgar_documents\INTU\4_2024-02-27' --> 'data\processed_data\INTU\4_2024-02-27.md'
Converted 'data\edgar_documents\INTU\4_2024-03-04' --> 'data\processed_data\INTU\4_2024-03-04.md'


2025-11-14 16:52:20,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:20,419 - INFO - Going to convert document batch...
2025-11-14 16:52:20,420 - INFO - Processing document 4_2024-04-02
2025-11-14 16:52:20,480 - INFO - Finished converting document 4_2024-04-02 in 0.11 sec.
2025-11-14 16:52:20,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-03-21' --> 'data\processed_data\INTU\4_2024-03-21.md'
Converted 'data\edgar_documents\INTU\4_2024-04-02' --> 'data\processed_data\INTU\4_2024-04-02.md'


2025-11-14 16:52:20,579 - INFO - Going to convert document batch...
2025-11-14 16:52:20,579 - INFO - Processing document 4_2024-05-06
2025-11-14 16:52:20,610 - INFO - Finished converting document 4_2024-05-06 in 0.06 sec.
2025-11-14 16:52:20,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:20,685 - INFO - Going to convert document batch...
2025-11-14 16:52:20,685 - INFO - Processing document 4_2024-05-29
2025-11-14 16:52:20,712 - INFO - Finished converting document 4_2024-05-29 in 0.05 sec.
2025-11-14 16:52:20,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:20,794 - INFO - Going to convert document batch...
2025-11-14 16:52:20,795 - INFO - Processing document 4_2024-05-30


Converted 'data\edgar_documents\INTU\4_2024-05-06' --> 'data\processed_data\INTU\4_2024-05-06.md'
Converted 'data\edgar_documents\INTU\4_2024-05-29' --> 'data\processed_data\INTU\4_2024-05-29.md'


2025-11-14 16:52:20,879 - INFO - Finished converting document 4_2024-05-30 in 0.14 sec.
2025-11-14 16:52:20,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,005 - INFO - Going to convert document batch...
2025-11-14 16:52:21,006 - INFO - Processing document 4_2024-05-31
2025-11-14 16:52:21,049 - INFO - Finished converting document 4_2024-05-31 in 0.09 sec.
2025-11-14 16:52:21,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,115 - INFO - Going to convert document batch...
2025-11-14 16:52:21,116 - INFO - Processing document 4_2024-06-04


Converted 'data\edgar_documents\INTU\4_2024-05-30' --> 'data\processed_data\INTU\4_2024-05-30.md'
Converted 'data\edgar_documents\INTU\4_2024-05-31' --> 'data\processed_data\INTU\4_2024-05-31.md'


2025-11-14 16:52:21,142 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 16:52:21,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,225 - INFO - Going to convert document batch...
2025-11-14 16:52:21,226 - INFO - Processing document 4_2024-06-12
2025-11-14 16:52:21,304 - INFO - Finished converting document 4_2024-06-12 in 0.14 sec.


Converted 'data\edgar_documents\INTU\4_2024-06-04' --> 'data\processed_data\INTU\4_2024-06-04.md'


2025-11-14 16:52:21,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,419 - INFO - Going to convert document batch...
2025-11-14 16:52:21,420 - INFO - Processing document 4_2024-07-03
2025-11-14 16:52:21,467 - INFO - Finished converting document 4_2024-07-03 in 0.11 sec.
2025-11-14 16:52:21,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,546 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2024-06-12' --> 'data\processed_data\INTU\4_2024-06-12.md'
Converted 'data\edgar_documents\INTU\4_2024-07-03' --> 'data\processed_data\INTU\4_2024-07-03.md'


2025-11-14 16:52:21,546 - INFO - Processing document 4_2024-07-29
2025-11-14 16:52:21,568 - INFO - Finished converting document 4_2024-07-29 in 0.06 sec.
2025-11-14 16:52:21,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,633 - INFO - Going to convert document batch...
2025-11-14 16:52:21,634 - INFO - Processing document 4_2024-08-13
2025-11-14 16:52:21,657 - INFO - Finished converting document 4_2024-08-13 in 0.06 sec.
2025-11-14 16:52:21,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:21,710 - INFO - Going to convert document batch...
2025-11-14 16:52:21,711 - INFO - Processing document 4_2024-08-15
2025-11-14 16:52:21,736 - INFO - Finished converting document 4_2024-08-15 in 0.05 sec.
2025-11-14 16:52:21,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-07-29' --> 'data\processed_data\INTU\4_2024-07-29.md'
Converted 'data\edgar_documents\INTU\4_2024-08-13' --> 'data\processed_data\INTU\4_2024-08-13.md'
Converted 'data\edgar_documents\INTU\4_2024-08-15' --> 'data\processed_data\INTU\4_2024-08-15.md'


2025-11-14 16:52:21,799 - INFO - Going to convert document batch...
2025-11-14 16:52:21,800 - INFO - Processing document 4_2024-08-27
2025-11-14 16:52:22,310 - INFO - Finished converting document 4_2024-08-27 in 0.55 sec.
2025-11-14 16:52:22,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:22,393 - INFO - Going to convert document batch...
2025-11-14 16:52:22,393 - INFO - Processing document 4_2024-08-28
2025-11-14 16:52:22,468 - INFO - Finished converting document 4_2024-08-28 in 0.14 sec.


Converted 'data\edgar_documents\INTU\4_2024-08-27' --> 'data\processed_data\INTU\4_2024-08-27.md'


2025-11-14 16:52:22,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:22,564 - INFO - Going to convert document batch...
2025-11-14 16:52:22,565 - INFO - Processing document 4_2024-09-04
2025-11-14 16:52:22,688 - INFO - Finished converting document 4_2024-09-04 in 0.16 sec.


Converted 'data\edgar_documents\INTU\4_2024-08-28' --> 'data\processed_data\INTU\4_2024-08-28.md'
Converted 'data\edgar_documents\INTU\4_2024-09-04' --> 'data\processed_data\INTU\4_2024-09-04.md'


2025-11-14 16:52:22,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:22,777 - INFO - Going to convert document batch...
2025-11-14 16:52:22,778 - INFO - Processing document 4_2024-09-11
2025-11-14 16:52:22,813 - INFO - Finished converting document 4_2024-09-11 in 0.09 sec.
2025-11-14 16:52:22,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:22,889 - INFO - Going to convert document batch...
2025-11-14 16:52:22,890 - INFO - Processing document 4_2024-09-19
2025-11-14 16:52:22,953 - INFO - Finished converting document 4_2024-09-19 in 0.11 sec.
2025-11-14 16:52:23,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-09-11' --> 'data\processed_data\INTU\4_2024-09-11.md'
Converted 'data\edgar_documents\INTU\4_2024-09-19' --> 'data\processed_data\INTU\4_2024-09-19.md'


2025-11-14 16:52:23,056 - INFO - Going to convert document batch...
2025-11-14 16:52:23,057 - INFO - Processing document 4_2024-09-24
2025-11-14 16:52:23,184 - INFO - Finished converting document 4_2024-09-24 in 0.20 sec.
2025-11-14 16:52:23,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:23,293 - INFO - Going to convert document batch...
2025-11-14 16:52:23,294 - INFO - Processing document 4_2024-10-03
2025-11-14 16:52:23,338 - INFO - Finished converting document 4_2024-10-03 in 0.09 sec.
2025-11-14 16:52:23,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-09-24' --> 'data\processed_data\INTU\4_2024-09-24.md'
Converted 'data\edgar_documents\INTU\4_2024-10-03' --> 'data\processed_data\INTU\4_2024-10-03.md'


2025-11-14 16:52:23,443 - INFO - Going to convert document batch...
2025-11-14 16:52:23,445 - INFO - Processing document 4_2024-10-11
2025-11-14 16:52:23,475 - INFO - Finished converting document 4_2024-10-11 in 0.09 sec.
2025-11-14 16:52:23,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:23,549 - INFO - Going to convert document batch...
2025-11-14 16:52:23,550 - INFO - Processing document 4_2024-11-04
2025-11-14 16:52:23,573 - INFO - Finished converting document 4_2024-11-04 in 0.05 sec.
2025-11-14 16:52:23,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:23,681 - INFO - Going to convert document batch...
2025-11-14 16:52:23,682 - INFO - Processing document 4_2024-11-27


Converted 'data\edgar_documents\INTU\4_2024-10-11' --> 'data\processed_data\INTU\4_2024-10-11.md'
Converted 'data\edgar_documents\INTU\4_2024-11-04' --> 'data\processed_data\INTU\4_2024-11-04.md'


2025-11-14 16:52:23,757 - INFO - Finished converting document 4_2024-11-27 in 0.16 sec.
2025-11-14 16:52:23,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:23,850 - INFO - Going to convert document batch...
2025-11-14 16:52:23,851 - INFO - Processing document 4_2024-12-03
2025-11-14 16:52:23,875 - INFO - Finished converting document 4_2024-12-03 in 0.05 sec.
2025-11-14 16:52:23,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:23,950 - INFO - Going to convert document batch...
2025-11-14 16:52:23,951 - INFO - Processing document 4_2024-12-09
2025-11-14 16:52:23,999 - INFO - Finished converting document 4_2024-12-09 in 0.11 sec.


Converted 'data\edgar_documents\INTU\4_2024-11-27' --> 'data\processed_data\INTU\4_2024-11-27.md'
Converted 'data\edgar_documents\INTU\4_2024-12-03' --> 'data\processed_data\INTU\4_2024-12-03.md'


2025-11-14 16:52:24,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:24,092 - INFO - Going to convert document batch...
2025-11-14 16:52:24,092 - INFO - Processing document 4_2024-12-10
2025-11-14 16:52:24,254 - INFO - Finished converting document 4_2024-12-10 in 0.20 sec.


Converted 'data\edgar_documents\INTU\4_2024-12-09' --> 'data\processed_data\INTU\4_2024-12-09.md'


2025-11-14 16:52:24,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:24,334 - INFO - Going to convert document batch...
2025-11-14 16:52:24,335 - INFO - Processing document 4_2024-12-11
2025-11-14 16:52:24,362 - INFO - Finished converting document 4_2024-12-11 in 0.06 sec.
2025-11-14 16:52:24,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2024-12-10' --> 'data\processed_data\INTU\4_2024-12-10.md'
Converted 'data\edgar_documents\INTU\4_2024-12-11' --> 'data\processed_data\INTU\4_2024-12-11.md'


2025-11-14 16:52:24,515 - INFO - Going to convert document batch...
2025-11-14 16:52:24,516 - INFO - Processing document 4_2024-12-13
2025-11-14 16:52:24,561 - INFO - Finished converting document 4_2024-12-13 in 0.17 sec.
2025-11-14 16:52:24,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:24,667 - INFO - Going to convert document batch...
2025-11-14 16:52:24,668 - INFO - Processing document 4_2024-12-16
2025-11-14 16:52:24,730 - INFO - Finished converting document 4_2024-12-16 in 0.14 sec.


Converted 'data\edgar_documents\INTU\4_2024-12-13' --> 'data\processed_data\INTU\4_2024-12-13.md'
Converted 'data\edgar_documents\INTU\4_2024-12-16' --> 'data\processed_data\INTU\4_2024-12-16.md'


2025-11-14 16:52:24,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:24,839 - INFO - Going to convert document batch...
2025-11-14 16:52:24,840 - INFO - Processing document 4_2024-12-20
2025-11-14 16:52:24,917 - INFO - Finished converting document 4_2024-12-20 in 0.16 sec.
2025-11-14 16:52:25,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,049 - INFO - Going to convert document batch...
2025-11-14 16:52:25,050 - INFO - Processing document 4_2025-01-02
2025-11-14 16:52:25,134 - INFO - Finished converting document 4_2025-01-02 in 0.14 sec.


Converted 'data\edgar_documents\INTU\4_2024-12-20' --> 'data\processed_data\INTU\4_2024-12-20.md'
Converted 'data\edgar_documents\INTU\4_2025-01-02' --> 'data\processed_data\INTU\4_2025-01-02.md'


2025-11-14 16:52:25,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,217 - INFO - Going to convert document batch...
2025-11-14 16:52:25,218 - INFO - Processing document 4_2025-01-03
2025-11-14 16:52:25,354 - INFO - Finished converting document 4_2025-01-03 in 0.17 sec.
2025-11-14 16:52:25,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,432 - INFO - Going to convert document batch...
2025-11-14 16:52:25,433 - INFO - Processing document 4_2025-01-06
2025-11-14 16:52:25,493 - INFO - Finished converting document 4_2025-01-06 in 0.09 sec.
2025-11-14 16:52:25,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,585 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2025-01-03' --> 'data\processed_data\INTU\4_2025-01-03.md'
Converted 'data\edgar_documents\INTU\4_2025-01-06' --> 'data\processed_data\INTU\4_2025-01-06.md'


2025-11-14 16:52:25,587 - INFO - Processing document 4_2025-01-08
2025-11-14 16:52:25,630 - INFO - Finished converting document 4_2025-01-08 in 0.09 sec.
2025-11-14 16:52:25,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,714 - INFO - Going to convert document batch...
2025-11-14 16:52:25,715 - INFO - Processing document 4_2025-01-10
2025-11-14 16:52:25,749 - INFO - Finished converting document 4_2025-01-10 in 0.08 sec.
2025-11-14 16:52:25,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,813 - INFO - Going to convert document batch...
2025-11-14 16:52:25,814 - INFO - Processing document 4_2025-01-13
2025-11-14 16:52:25,834 - INFO - Finished converting document 4_2025-01-13 in 0.06 sec.


Converted 'data\edgar_documents\INTU\4_2025-01-08' --> 'data\processed_data\INTU\4_2025-01-08.md'
Converted 'data\edgar_documents\INTU\4_2025-01-10' --> 'data\processed_data\INTU\4_2025-01-10.md'


2025-11-14 16:52:25,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:25,898 - INFO - Going to convert document batch...
2025-11-14 16:52:25,898 - INFO - Processing document 4_2025-01-22
2025-11-14 16:52:26,008 - INFO - Finished converting document 4_2025-01-22 in 0.14 sec.


Converted 'data\edgar_documents\INTU\4_2025-01-13' --> 'data\processed_data\INTU\4_2025-01-13.md'
Converted 'data\edgar_documents\INTU\4_2025-01-22' --> 'data\processed_data\INTU\4_2025-01-22.md'


2025-11-14 16:52:26,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,092 - INFO - Going to convert document batch...
2025-11-14 16:52:26,093 - INFO - Processing document 4_2025-01-28
2025-11-14 16:52:26,122 - INFO - Finished converting document 4_2025-01-28 in 0.09 sec.
2025-11-14 16:52:26,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,205 - INFO - Going to convert document batch...
2025-11-14 16:52:26,206 - INFO - Processing document 4_2025-03-03
2025-11-14 16:52:26,258 - INFO - Finished converting document 4_2025-03-03 in 0.09 sec.
2025-11-14 16:52:26,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,345 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2025-01-28' --> 'data\processed_data\INTU\4_2025-01-28.md'
Converted 'data\edgar_documents\INTU\4_2025-03-03' --> 'data\processed_data\INTU\4_2025-03-03.md'


2025-11-14 16:52:26,346 - INFO - Processing document 4_2025-03-04
2025-11-14 16:52:26,379 - INFO - Finished converting document 4_2025-03-04 in 0.06 sec.
2025-11-14 16:52:26,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,539 - INFO - Going to convert document batch...
2025-11-14 16:52:26,540 - INFO - Processing document 4_2025-03-12


Converted 'data\edgar_documents\INTU\4_2025-03-04' --> 'data\processed_data\INTU\4_2025-03-04.md'


2025-11-14 16:52:26,601 - INFO - Finished converting document 4_2025-03-12 in 0.19 sec.
2025-11-14 16:52:26,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,705 - INFO - Going to convert document batch...
2025-11-14 16:52:26,706 - INFO - Processing document 4_2025-03-21
2025-11-14 16:52:26,729 - INFO - Finished converting document 4_2025-03-21 in 0.08 sec.
2025-11-14 16:52:26,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,789 - INFO - Going to convert document batch...
2025-11-14 16:52:26,789 - INFO - Processing document 4_2025-03-24
2025-11-14 16:52:26,829 - INFO - Finished converting document 4_2025-03-24 in 0.08 sec.


Converted 'data\edgar_documents\INTU\4_2025-03-12' --> 'data\processed_data\INTU\4_2025-03-12.md'
Converted 'data\edgar_documents\INTU\4_2025-03-21' --> 'data\processed_data\INTU\4_2025-03-21.md'


2025-11-14 16:52:26,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,904 - INFO - Going to convert document batch...
2025-11-14 16:52:26,905 - INFO - Processing document 4_2025-03-25
2025-11-14 16:52:26,933 - INFO - Finished converting document 4_2025-03-25 in 0.08 sec.
2025-11-14 16:52:26,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:26,993 - INFO - Going to convert document batch...
2025-11-14 16:52:26,994 - INFO - Processing document 4_2025-04-03


Converted 'data\edgar_documents\INTU\4_2025-03-24' --> 'data\processed_data\INTU\4_2025-03-24.md'
Converted 'data\edgar_documents\INTU\4_2025-03-25' --> 'data\processed_data\INTU\4_2025-03-25.md'


2025-11-14 16:52:27,330 - INFO - Finished converting document 4_2025-04-03 in 0.38 sec.
2025-11-14 16:52:27,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:27,407 - INFO - Going to convert document batch...
2025-11-14 16:52:27,408 - INFO - Processing document 4_2025-05-06
2025-11-14 16:52:27,457 - INFO - Finished converting document 4_2025-05-06 in 0.09 sec.
2025-11-14 16:52:27,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:27,534 - INFO - Going to convert document batch...
2025-11-14 16:52:27,534 - INFO - Processing document 4_2025-05-12


Converted 'data\edgar_documents\INTU\4_2025-04-03' --> 'data\processed_data\INTU\4_2025-04-03.md'
Converted 'data\edgar_documents\INTU\4_2025-05-06' --> 'data\processed_data\INTU\4_2025-05-06.md'


2025-11-14 16:52:27,562 - INFO - Finished converting document 4_2025-05-12 in 0.08 sec.
2025-11-14 16:52:27,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:27,625 - INFO - Going to convert document batch...
2025-11-14 16:52:27,627 - INFO - Processing document 4_2025-05-13
2025-11-14 16:52:27,656 - INFO - Finished converting document 4_2025-05-13 in 0.08 sec.
2025-11-14 16:52:27,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:27,750 - INFO - Going to convert document batch...
2025-11-14 16:52:27,752 - INFO - Processing document 4_2025-05-29


Converted 'data\edgar_documents\INTU\4_2025-05-12' --> 'data\processed_data\INTU\4_2025-05-12.md'
Converted 'data\edgar_documents\INTU\4_2025-05-13' --> 'data\processed_data\INTU\4_2025-05-13.md'


2025-11-14 16:52:27,843 - INFO - Finished converting document 4_2025-05-29 in 0.16 sec.
2025-11-14 16:52:27,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:27,963 - INFO - Going to convert document batch...
2025-11-14 16:52:27,963 - INFO - Processing document 4_2025-05-30
2025-11-14 16:52:28,004 - INFO - Finished converting document 4_2025-05-30 in 0.08 sec.
2025-11-14 16:52:28,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,097 - INFO - Going to convert document batch...
2025-11-14 16:52:28,097 - INFO - Processing document 4_2025-06-02


Converted 'data\edgar_documents\INTU\4_2025-05-29' --> 'data\processed_data\INTU\4_2025-05-29.md'
Converted 'data\edgar_documents\INTU\4_2025-05-30' --> 'data\processed_data\INTU\4_2025-05-30.md'


2025-11-14 16:52:28,121 - INFO - Finished converting document 4_2025-06-02 in 0.08 sec.
2025-11-14 16:52:28,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,188 - INFO - Going to convert document batch...
2025-11-14 16:52:28,189 - INFO - Processing document 4_2025-06-05
2025-11-14 16:52:28,222 - INFO - Finished converting document 4_2025-06-05 in 0.08 sec.
2025-11-14 16:52:28,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,304 - INFO - Going to convert document batch...
2025-11-14 16:52:28,305 - INFO - Processing document 4_2025-06-10


Converted 'data\edgar_documents\INTU\4_2025-06-02' --> 'data\processed_data\INTU\4_2025-06-02.md'
Converted 'data\edgar_documents\INTU\4_2025-06-05' --> 'data\processed_data\INTU\4_2025-06-05.md'


2025-11-14 16:52:28,350 - INFO - Finished converting document 4_2025-06-10 in 0.09 sec.
2025-11-14 16:52:28,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,429 - INFO - Going to convert document batch...
2025-11-14 16:52:28,430 - INFO - Processing document 4_2025-06-27
2025-11-14 16:52:28,457 - INFO - Finished converting document 4_2025-06-27 in 0.06 sec.
2025-11-14 16:52:28,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,526 - INFO - Going to convert document batch...
2025-11-14 16:52:28,527 - INFO - Processing document 4_2025-07-03
2025-11-14 16:52:28,587 - INFO - Finished converting document 4_2025-07-03 in 0.11 sec.


Converted 'data\edgar_documents\INTU\4_2025-06-10' --> 'data\processed_data\INTU\4_2025-06-10.md'
Converted 'data\edgar_documents\INTU\4_2025-06-27' --> 'data\processed_data\INTU\4_2025-06-27.md'


2025-11-14 16:52:28,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,682 - INFO - Going to convert document batch...
2025-11-14 16:52:28,683 - INFO - Processing document 4_2025-07-08
2025-11-14 16:52:28,725 - INFO - Finished converting document 4_2025-07-08 in 0.08 sec.
2025-11-14 16:52:28,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,802 - INFO - Going to convert document batch...
2025-11-14 16:52:28,803 - INFO - Processing document 4_2025-07-09


Converted 'data\edgar_documents\INTU\4_2025-07-03' --> 'data\processed_data\INTU\4_2025-07-03.md'
Converted 'data\edgar_documents\INTU\4_2025-07-08' --> 'data\processed_data\INTU\4_2025-07-08.md'


2025-11-14 16:52:28,830 - INFO - Finished converting document 4_2025-07-09 in 0.08 sec.
2025-11-14 16:52:28,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,892 - INFO - Going to convert document batch...
2025-11-14 16:52:28,893 - INFO - Processing document 4_2025-07-10
2025-11-14 16:52:28,917 - INFO - Finished converting document 4_2025-07-10 in 0.05 sec.
2025-11-14 16:52:28,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:28,976 - INFO - Going to convert document batch...
2025-11-14 16:52:28,976 - INFO - Processing document 4_2025-07-28
2025-11-14 16:52:29,001 - INFO - Finished converting document 4_2025-07-28 in 0.06 sec.
2025-11-14 16:52:29,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\4_2025-07-09' --> 'data\processed_data\INTU\4_2025-07-09.md'
Converted 'data\edgar_documents\INTU\4_2025-07-10' --> 'data\processed_data\INTU\4_2025-07-10.md'
Converted 'data\edgar_documents\INTU\4_2025-07-28' --> 'data\processed_data\INTU\4_2025-07-28.md'


2025-11-14 16:52:29,073 - INFO - Going to convert document batch...
2025-11-14 16:52:29,074 - INFO - Processing document 4_2025-07-29
2025-11-14 16:52:29,099 - INFO - Finished converting document 4_2025-07-29 in 0.06 sec.
2025-11-14 16:52:29,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,162 - INFO - Going to convert document batch...
2025-11-14 16:52:29,163 - INFO - Processing document 4_2025-07-31
2025-11-14 16:52:29,196 - INFO - Finished converting document 4_2025-07-31 in 0.06 sec.
2025-11-14 16:52:29,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,262 - INFO - Going to convert document batch...
2025-11-14 16:52:29,262 - INFO - Processing document 4_2025-08-12
2025-11-14 16:52:29,293 - INFO - Finished converting document 4_2025-08-12 in 0.08 sec.


Converted 'data\edgar_documents\INTU\4_2025-07-29' --> 'data\processed_data\INTU\4_2025-07-29.md'
Converted 'data\edgar_documents\INTU\4_2025-07-31' --> 'data\processed_data\INTU\4_2025-07-31.md'


2025-11-14 16:52:29,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,376 - INFO - Going to convert document batch...
2025-11-14 16:52:29,413 - INFO - Processing document 4_2025-08-14
2025-11-14 16:52:29,500 - INFO - Finished converting document 4_2025-08-14 in 0.17 sec.


Converted 'data\edgar_documents\INTU\4_2025-08-12' --> 'data\processed_data\INTU\4_2025-08-12.md'
Converted 'data\edgar_documents\INTU\4_2025-08-14' --> 'data\processed_data\INTU\4_2025-08-14.md'


2025-11-14 16:52:29,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,585 - INFO - Going to convert document batch...
2025-11-14 16:52:29,586 - INFO - Processing document 4_2025-08-26
2025-11-14 16:52:29,614 - INFO - Finished converting document 4_2025-08-26 in 0.08 sec.
2025-11-14 16:52:29,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,674 - INFO - Going to convert document batch...
2025-11-14 16:52:29,675 - INFO - Processing document 4_2025-09-03
2025-11-14 16:52:29,716 - INFO - Finished converting document 4_2025-09-03 in 0.08 sec.
2025-11-14 16:52:29,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,808 - INFO - Going to convert document batch...
2025-11-14 16:52:29,809 - INFO - Processing document 4_2025-09-11
2025-11-14 16:52:29,844 - INFO - Finished converting document 4_2025-09-11 in 0.09 sec.


Converted 'data\edgar_documents\INTU\4_2025-08-26' --> 'data\processed_data\INTU\4_2025-08-26.md'
Converted 'data\edgar_documents\INTU\4_2025-09-03' --> 'data\processed_data\INTU\4_2025-09-03.md'


2025-11-14 16:52:29,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:29,915 - INFO - Going to convert document batch...
2025-11-14 16:52:29,916 - INFO - Processing document 4_2025-10-02
2025-11-14 16:52:30,060 - INFO - Finished converting document 4_2025-10-02 in 0.19 sec.


Converted 'data\edgar_documents\INTU\4_2025-09-11' --> 'data\processed_data\INTU\4_2025-09-11.md'


2025-11-14 16:52:30,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,140 - INFO - Going to convert document batch...
2025-11-14 16:52:30,141 - INFO - Processing document 4_2025-10-07
2025-11-14 16:52:30,168 - INFO - Finished converting document 4_2025-10-07 in 0.06 sec.
2025-11-14 16:52:30,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,222 - INFO - Going to convert document batch...
2025-11-14 16:52:30,222 - INFO - Processing document 4_2025-10-21
2025-11-14 16:52:30,247 - INFO - Finished converting document 4_2025-10-21 in 0.05 sec.
2025-11-14 16:52:30,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,298 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\4_2025-10-02' --> 'data\processed_data\INTU\4_2025-10-02.md'
Converted 'data\edgar_documents\INTU\4_2025-10-07' --> 'data\processed_data\INTU\4_2025-10-07.md'
Converted 'data\edgar_documents\INTU\4_2025-10-21' --> 'data\processed_data\INTU\4_2025-10-21.md'


2025-11-14 16:52:30,298 - INFO - Processing document 4_2025-11-03
2025-11-14 16:52:30,329 - INFO - Finished converting document 4_2025-11-03 in 0.06 sec.
2025-11-14 16:52:30,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,476 - INFO - Going to convert document batch...
2025-11-14 16:52:30,476 - INFO - Processing document 4_2025-11-04
2025-11-14 16:52:30,500 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 16:52:30,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,596 - INFO - Going to convert document batch...
2025-11-14 16:52:30,597 - INFO - Processing document 8-K_2023-01-23
2025-11-14 16:52:30,632 - INFO - Finished converting document 8-K_2023-01-23 in 0.09 sec.


Converted 'data\edgar_documents\INTU\4_2025-11-03' --> 'data\processed_data\INTU\4_2025-11-03.md'
Converted 'data\edgar_documents\INTU\4_2025-11-04' --> 'data\processed_data\INTU\4_2025-11-04.md'


2025-11-14 16:52:30,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,687 - INFO - Going to convert document batch...
2025-11-14 16:52:30,688 - INFO - Processing document 8-K_2023-02-23
2025-11-14 16:52:30,717 - INFO - Finished converting document 8-K_2023-02-23 in 0.08 sec.
2025-11-14 16:52:30,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,792 - INFO - Going to convert document batch...
2025-11-14 16:52:30,793 - INFO - Processing document 8-K_2023-05-04
2025-11-14 16:52:30,814 - INFO - Finished converting document 8-K_2023-05-04 in 0.08 sec.


Converted 'data\edgar_documents\INTU\8-K_2023-01-23' --> 'data\processed_data\INTU\8-K_2023-01-23.md'
Converted 'data\edgar_documents\INTU\8-K_2023-02-23' --> 'data\processed_data\INTU\8-K_2023-02-23.md'


2025-11-14 16:52:30,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:30,872 - INFO - Going to convert document batch...
2025-11-14 16:52:30,873 - INFO - Processing document 8-K_2023-05-23
2025-11-14 16:52:30,898 - INFO - Finished converting document 8-K_2023-05-23 in 0.06 sec.


Converted 'data\edgar_documents\INTU\8-K_2023-05-04' --> 'data\processed_data\INTU\8-K_2023-05-04.md'
Converted 'data\edgar_documents\INTU\8-K_2023-05-23' --> 'data\processed_data\INTU\8-K_2023-05-23.md'


2025-11-14 16:52:31,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,072 - INFO - Going to convert document batch...
2025-11-14 16:52:31,073 - INFO - Processing document 8-K_2023-08-02
2025-11-14 16:52:31,094 - INFO - Finished converting document 8-K_2023-08-02 in 0.09 sec.
2025-11-14 16:52:31,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,156 - INFO - Going to convert document batch...
2025-11-14 16:52:31,157 - INFO - Processing document 8-K_2023-08-14
2025-11-14 16:52:31,177 - INFO - Finished converting document 8-K_2023-08-14 in 0.06 sec.
2025-11-14 16:52:31,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,231 - INFO - Going to convert document batch...
2025-11-14 16:52:31,232 - INFO - Processing document 8-K_2023-08-24
2025-11-14 16:52:31,255 - INFO - Finished converting document 8-K_2023-08-24 in 0.06 sec.


Converted 'data\edgar_documents\INTU\8-K_2023-08-02' --> 'data\processed_data\INTU\8-K_2023-08-02.md'
Converted 'data\edgar_documents\INTU\8-K_2023-08-14' --> 'data\processed_data\INTU\8-K_2023-08-14.md'
Converted 'data\edgar_documents\INTU\8-K_2023-08-24' --> 'data\processed_data\INTU\8-K_2023-08-24.md'


2025-11-14 16:52:31,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,314 - INFO - Going to convert document batch...
2025-11-14 16:52:31,315 - INFO - Processing document 8-K_2023-09-15
2025-11-14 16:52:31,343 - INFO - Finished converting document 8-K_2023-09-15 in 0.08 sec.
2025-11-14 16:52:31,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,467 - INFO - Going to convert document batch...
2025-11-14 16:52:31,468 - INFO - Processing document 8-K_2023-11-28
2025-11-14 16:52:31,487 - INFO - Finished converting document 8-K_2023-11-28 in 0.12 sec.
2025-11-14 16:52:31,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,552 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\INTU\8-K_2023-09-15' --> 'data\processed_data\INTU\8-K_2023-09-15.md'
Converted 'data\edgar_documents\INTU\8-K_2023-11-28' --> 'data\processed_data\INTU\8-K_2023-11-28.md'


2025-11-14 16:52:31,554 - INFO - Processing document 8-K_2024-01-22
2025-11-14 16:52:31,597 - INFO - Finished converting document 8-K_2024-01-22 in 0.09 sec.
2025-11-14 16:52:31,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,667 - INFO - Going to convert document batch...
2025-11-14 16:52:31,669 - INFO - Processing document 8-K_2024-02-22
2025-11-14 16:52:31,693 - INFO - Finished converting document 8-K_2024-02-22 in 0.08 sec.


Converted 'data\edgar_documents\INTU\8-K_2024-01-22' --> 'data\processed_data\INTU\8-K_2024-01-22.md'
Converted 'data\edgar_documents\INTU\8-K_2024-02-22' --> 'data\processed_data\INTU\8-K_2024-02-22.md'


2025-11-14 16:52:31,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,844 - INFO - Going to convert document batch...
2025-11-14 16:52:31,845 - INFO - Processing document 8-K_2024-05-02
2025-11-14 16:52:31,879 - INFO - Finished converting document 8-K_2024-05-02 in 0.17 sec.
2025-11-14 16:52:31,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:31,936 - INFO - Going to convert document batch...
2025-11-14 16:52:31,937 - INFO - Processing document 8-K_2024-05-23
2025-11-14 16:52:31,957 - INFO - Finished converting document 8-K_2024-05-23 in 0.06 sec.
2025-11-14 16:52:31,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,010 - INFO - Going to convert document batch...
2025-11-14 16:52:32,011 - INFO - Processing document 8-K_2024-07-10
2025-11-14 16:52:32,040 - INFO - Finished converting document 8-K_2024-07-10 in 0.06 sec.
2025-11-14 16:52:32,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\8-K_2024-05-02' --> 'data\processed_data\INTU\8-K_2024-05-02.md'
Converted 'data\edgar_documents\INTU\8-K_2024-05-23' --> 'data\processed_data\INTU\8-K_2024-05-23.md'
Converted 'data\edgar_documents\INTU\8-K_2024-07-10' --> 'data\processed_data\INTU\8-K_2024-07-10.md'


2025-11-14 16:52:32,104 - INFO - Going to convert document batch...
2025-11-14 16:52:32,105 - INFO - Processing document 8-K_2024-07-25
2025-11-14 16:52:32,137 - INFO - Finished converting document 8-K_2024-07-25 in 0.09 sec.
2025-11-14 16:52:32,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,195 - INFO - Going to convert document batch...
2025-11-14 16:52:32,196 - INFO - Processing document 8-K_2024-08-22
2025-11-14 16:52:32,219 - INFO - Finished converting document 8-K_2024-08-22 in 0.05 sec.
2025-11-14 16:52:32,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,279 - INFO - Going to convert document batch...
2025-11-14 16:52:32,280 - INFO - Processing document 8-K_2024-11-04
2025-11-14 16:52:32,300 - INFO - Finished converting document 8-K_2024-11-04 in 0.06 sec.
2025-11-14 16:52:32,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,337 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\INTU\8-K_2024-07-25' --> 'data\processed_data\INTU\8-K_2024-07-25.md'
Converted 'data\edgar_documents\INTU\8-K_2024-08-22' --> 'data\processed_data\INTU\8-K_2024-08-22.md'
Converted 'data\edgar_documents\INTU\8-K_2024-11-04' --> 'data\processed_data\INTU\8-K_2024-11-04.md'


2025-11-14 16:52:32,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,424 - INFO - Going to convert document batch...
2025-11-14 16:52:32,425 - INFO - Processing document 8-K_2025-01-27
2025-11-14 16:52:32,475 - INFO - Finished converting document 8-K_2025-01-27 in 0.09 sec.
2025-11-14 16:52:32,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:32,525 - INFO - Going to convert document batch...
2025-11-14 16:52:32,527 - INFO - Processing document 8-K_2025-01-31
2025-11-14 16:52:32,560 - INFO - Finished converting document 8-K_2025-01-31 in 0.08 sec.


Converted 'data\edgar_documents\INTU\8-K_2024-11-21' --> 'data\processed_data\INTU\8-K_2024-11-21.md'
Converted 'data\edgar_documents\INTU\8-K_2025-01-27' --> 'data\processed_data\INTU\8-K_2025-01-27.md'


2025-11-14 16:52:32,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\8-K_2025-01-31' --> 'data\processed_data\INTU\8-K_2025-01-31.md'


2025-11-14 16:52:32,909 - INFO - Going to convert document batch...
2025-11-14 16:52:32,911 - INFO - Processing document 8-K_2025-02-25
2025-11-14 16:52:32,934 - INFO - Finished converting document 8-K_2025-02-25 in 0.38 sec.
2025-11-14 16:52:32,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:33,001 - INFO - Going to convert document batch...
2025-11-14 16:52:33,002 - INFO - Processing document 8-K_2025-05-22
2025-11-14 16:52:33,025 - INFO - Finished converting document 8-K_2025-05-22 in 0.06 sec.
2025-11-14 16:52:33,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:33,086 - INFO - Going to convert document batch...
2025-11-14 16:52:33,088 - INFO - Processing document 8-K_2025-06-16
2025-11-14 16:52:33,110 - INFO - Finished converting document 8-K_2025-06-16 in 0.08 sec.


Converted 'data\edgar_documents\INTU\8-K_2025-02-25' --> 'data\processed_data\INTU\8-K_2025-02-25.md'
Converted 'data\edgar_documents\INTU\8-K_2025-05-22' --> 'data\processed_data\INTU\8-K_2025-05-22.md'
Converted 'data\edgar_documents\INTU\8-K_2025-06-16' --> 'data\processed_data\INTU\8-K_2025-06-16.md'


2025-11-14 16:52:33,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:33,183 - INFO - Going to convert document batch...
2025-11-14 16:52:33,185 - INFO - Processing document 8-K_2025-08-21
2025-11-14 16:52:33,222 - INFO - Finished converting document 8-K_2025-08-21 in 0.09 sec.
2025-11-14 16:52:33,314 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:52:33,315 - ERROR - Input document DEF-14A_2023-11-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\INTU\8-K_2025-08-21' --> 'data\processed_data\INTU\8-K_2025-08-21.md'
Error processing data\edgar_documents\INTU\DEF-14A_2023-11-22: File format not allowed: data\edgar_documents\INTU\DEF-14A_2023-11-22


2025-11-14 16:52:33,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:52:34,004 - INFO - Going to convert document batch...
2025-11-14 16:52:34,004 - INFO - Processing document DEF-14A_2024-11-27
2025-11-14 16:52:36,909 - INFO - Finished converting document DEF-14A_2024-11-27 in 3.59 sec.
2025-11-14 16:52:38,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\INTU\DEF-14A_2024-11-27' --> 'data\processed_data\INTU\DEF-14A_2024-11-27.md'
Processed 147 new files. Errors: 3
Found 150 files to process in data\edgar_documents\ISRG


2025-11-14 16:52:38,823 - INFO - Going to convert document batch...
2025-11-14 16:52:38,824 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:52:38,825 - INFO - Processing document 10-K_2023-02-10
2025-11-14 16:52:40,369 - INFO - Finished converting document 10-K_2023-02-10 in 2.39 sec.
2025-11-14 16:52:40,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-K_2023-02-10' --> 'data\processed_data\ISRG\10-K_2023-02-10.md'


2025-11-14 16:52:41,959 - INFO - Going to convert document batch...
2025-11-14 16:52:41,960 - INFO - Processing document 10-K_2024-01-31
2025-11-14 16:52:43,406 - INFO - Finished converting document 10-K_2024-01-31 in 2.48 sec.
2025-11-14 16:52:44,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-K_2024-01-31' --> 'data\processed_data\ISRG\10-K_2024-01-31.md'


2025-11-14 16:52:45,155 - INFO - Going to convert document batch...
2025-11-14 16:52:45,156 - INFO - Processing document 10-K_2025-01-31
2025-11-14 16:52:46,612 - INFO - Finished converting document 10-K_2025-01-31 in 2.61 sec.
2025-11-14 16:52:47,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-K_2025-01-31' --> 'data\processed_data\ISRG\10-K_2025-01-31.md'


2025-11-14 16:52:47,675 - INFO - Going to convert document batch...
2025-11-14 16:52:47,675 - INFO - Processing document 10-Q_2023-04-20
2025-11-14 16:52:48,410 - INFO - Finished converting document 10-Q_2023-04-20 in 1.19 sec.
2025-11-14 16:52:48,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2023-04-20' --> 'data\processed_data\ISRG\10-Q_2023-04-20.md'


2025-11-14 16:52:49,884 - INFO - Going to convert document batch...
2025-11-14 16:52:49,885 - INFO - Processing document 10-Q_2023-07-24
2025-11-14 16:52:51,007 - INFO - Finished converting document 10-Q_2023-07-24 in 2.22 sec.
2025-11-14 16:52:51,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2023-07-24' --> 'data\processed_data\ISRG\10-Q_2023-07-24.md'


2025-11-14 16:52:52,594 - INFO - Going to convert document batch...
2025-11-14 16:52:52,595 - INFO - Processing document 10-Q_2023-10-20
2025-11-14 16:52:53,521 - INFO - Finished converting document 10-Q_2023-10-20 in 1.89 sec.
2025-11-14 16:52:54,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2023-10-20' --> 'data\processed_data\ISRG\10-Q_2023-10-20.md'


2025-11-14 16:52:54,705 - INFO - Going to convert document batch...
2025-11-14 16:52:54,706 - INFO - Processing document 10-Q_2024-04-19
2025-11-14 16:52:55,819 - INFO - Finished converting document 10-Q_2024-04-19 in 1.72 sec.
2025-11-14 16:52:56,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2024-04-19' --> 'data\processed_data\ISRG\10-Q_2024-04-19.md'


2025-11-14 16:52:57,346 - INFO - Going to convert document batch...
2025-11-14 16:52:57,347 - INFO - Processing document 10-Q_2024-07-19
2025-11-14 16:52:58,243 - INFO - Finished converting document 10-Q_2024-07-19 in 1.80 sec.
2025-11-14 16:52:58,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2024-07-19' --> 'data\processed_data\ISRG\10-Q_2024-07-19.md'


2025-11-14 16:52:59,427 - INFO - Going to convert document batch...
2025-11-14 16:52:59,428 - INFO - Processing document 10-Q_2024-10-18
2025-11-14 16:53:00,931 - INFO - Finished converting document 10-Q_2024-10-18 in 2.22 sec.
2025-11-14 16:53:01,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2024-10-18' --> 'data\processed_data\ISRG\10-Q_2024-10-18.md'


2025-11-14 16:53:01,947 - INFO - Going to convert document batch...
2025-11-14 16:53:01,948 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 16:53:02,743 - INFO - Finished converting document 10-Q_2025-04-23 in 1.25 sec.


Converted 'data\edgar_documents\ISRG\10-Q_2025-04-23' --> 'data\processed_data\ISRG\10-Q_2025-04-23.md'


2025-11-14 16:53:03,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:03,911 - INFO - Going to convert document batch...
2025-11-14 16:53:03,912 - INFO - Processing document 10-Q_2025-07-23
2025-11-14 16:53:05,529 - INFO - Finished converting document 10-Q_2025-07-23 in 2.39 sec.
2025-11-14 16:53:06,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\10-Q_2025-07-23' --> 'data\processed_data\ISRG\10-Q_2025-07-23.md'


2025-11-14 16:53:06,676 - INFO - Going to convert document batch...
2025-11-14 16:53:06,676 - INFO - Processing document 10-Q_2025-10-22
2025-11-14 16:53:07,663 - INFO - Finished converting document 10-Q_2025-10-22 in 1.62 sec.
2025-11-14 16:53:08,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,201 - INFO - Going to convert document batch...
2025-11-14 16:53:08,201 - INFO - Processing document 4_2023-01-30
2025-11-14 16:53:08,230 - INFO - Finished converting document 4_2023-01-30 in 0.06 sec.
2025-11-14 16:53:08,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,293 - INFO - Going to convert document batch...
2025-11-14 16:53:08,294 - INFO - Processing document 4_2023-02-07
2025-11-14 16:53:08,322 - INFO - Finished converting document 4_2023-02-07 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\10-Q_2025-10-22' --> 'data\processed_data\ISRG\10-Q_2025-10-22.md'
Converted 'data\edgar_documents\ISRG\4_2023-01-30' --> 'data\processed_data\ISRG\4_2023-01-30.md'
Converted 'data\edgar_documents\ISRG\4_2023-02-07' --> 'data\processed_data\ISRG\4_2023-02-07.md'


2025-11-14 16:53:08,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,389 - INFO - Going to convert document batch...
2025-11-14 16:53:08,390 - INFO - Processing document 4_2023-02-14
2025-11-14 16:53:08,416 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.
2025-11-14 16:53:08,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,573 - INFO - Going to convert document batch...
2025-11-14 16:53:08,574 - INFO - Processing document 4_2023-02-16
2025-11-14 16:53:08,600 - INFO - Finished converting document 4_2023-02-16 in 0.14 sec.
2025-11-14 16:53:08,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2023-02-14' --> 'data\processed_data\ISRG\4_2023-02-14.md'
Converted 'data\edgar_documents\ISRG\4_2023-02-16' --> 'data\processed_data\ISRG\4_2023-02-16.md'


2025-11-14 16:53:08,656 - INFO - Going to convert document batch...
2025-11-14 16:53:08,658 - INFO - Processing document 4_2023-02-27
2025-11-14 16:53:08,695 - INFO - Finished converting document 4_2023-02-27 in 0.06 sec.
2025-11-14 16:53:08,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,763 - INFO - Going to convert document batch...
2025-11-14 16:53:08,764 - INFO - Processing document 4_2023-03-01
2025-11-14 16:53:08,800 - INFO - Finished converting document 4_2023-03-01 in 0.08 sec.
2025-11-14 16:53:08,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,865 - INFO - Going to convert document batch...
2025-11-14 16:53:08,866 - INFO - Processing document 4_2023-04-24
2025-11-14 16:53:08,899 - INFO - Finished converting document 4_2023-04-24 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2023-02-27' --> 'data\processed_data\ISRG\4_2023-02-27.md'
Converted 'data\edgar_documents\ISRG\4_2023-03-01' --> 'data\processed_data\ISRG\4_2023-03-01.md'


2025-11-14 16:53:08,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:08,973 - INFO - Going to convert document batch...
2025-11-14 16:53:08,974 - INFO - Processing document 4_2023-04-28
2025-11-14 16:53:09,010 - INFO - Finished converting document 4_2023-04-28 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\4_2023-04-24' --> 'data\processed_data\ISRG\4_2023-04-24.md'
Converted 'data\edgar_documents\ISRG\4_2023-04-28' --> 'data\processed_data\ISRG\4_2023-04-28.md'


2025-11-14 16:53:09,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:09,159 - INFO - Going to convert document batch...
2025-11-14 16:53:09,160 - INFO - Processing document 4_2023-05-01
2025-11-14 16:53:09,230 - INFO - Finished converting document 4_2023-05-01 in 0.16 sec.
2025-11-14 16:53:09,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:09,345 - INFO - Going to convert document batch...
2025-11-14 16:53:09,346 - INFO - Processing document 4_2023-05-02
2025-11-14 16:53:09,375 - INFO - Finished converting document 4_2023-05-02 in 0.09 sec.
2025-11-14 16:53:09,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:09,434 - INFO - Going to convert document batch...
2025-11-14 16:53:09,434 - INFO - Processing document 4_2023-05-03


Converted 'data\edgar_documents\ISRG\4_2023-05-01' --> 'data\processed_data\ISRG\4_2023-05-01.md'
Converted 'data\edgar_documents\ISRG\4_2023-05-02' --> 'data\processed_data\ISRG\4_2023-05-02.md'


2025-11-14 16:53:09,908 - INFO - Finished converting document 4_2023-05-03 in 0.50 sec.
2025-11-14 16:53:09,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,008 - INFO - Going to convert document batch...
2025-11-14 16:53:10,008 - INFO - Processing document 4_2023-05-12
2025-11-14 16:53:10,034 - INFO - Finished converting document 4_2023-05-12 in 0.08 sec.
2025-11-14 16:53:10,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,096 - INFO - Going to convert document batch...
2025-11-14 16:53:10,097 - INFO - Processing document 4_2023-06-15
2025-11-14 16:53:10,119 - INFO - Finished converting document 4_2023-06-15 in 0.05 sec.


Converted 'data\edgar_documents\ISRG\4_2023-05-03' --> 'data\processed_data\ISRG\4_2023-05-03.md'
Converted 'data\edgar_documents\ISRG\4_2023-05-12' --> 'data\processed_data\ISRG\4_2023-05-12.md'


2025-11-14 16:53:10,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,277 - INFO - Going to convert document batch...
2025-11-14 16:53:10,279 - INFO - Processing document 4_2023-07-26


Converted 'data\edgar_documents\ISRG\4_2023-06-15' --> 'data\processed_data\ISRG\4_2023-06-15.md'


2025-11-14 16:53:10,340 - INFO - Finished converting document 4_2023-07-26 in 0.20 sec.
2025-11-14 16:53:10,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,499 - INFO - Going to convert document batch...
2025-11-14 16:53:10,501 - INFO - Processing document 4_2023-08-01
2025-11-14 16:53:10,540 - INFO - Finished converting document 4_2023-08-01 in 0.14 sec.


Converted 'data\edgar_documents\ISRG\4_2023-07-26' --> 'data\processed_data\ISRG\4_2023-07-26.md'
Converted 'data\edgar_documents\ISRG\4_2023-08-01' --> 'data\processed_data\ISRG\4_2023-08-01.md'


2025-11-14 16:53:10,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,649 - INFO - Going to convert document batch...
2025-11-14 16:53:10,650 - INFO - Processing document 4_2023-08-08
2025-11-14 16:53:10,691 - INFO - Finished converting document 4_2023-08-08 in 0.12 sec.
2025-11-14 16:53:10,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,746 - INFO - Going to convert document batch...
2025-11-14 16:53:10,747 - INFO - Processing document 4_2023-08-11
2025-11-14 16:53:10,767 - INFO - Finished converting document 4_2023-08-11 in 0.05 sec.
2025-11-14 16:53:10,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,840 - INFO - Going to convert document batch...
2025-11-14 16:53:10,841 - INFO - Processing document 4_2023-08-14
2025-11-14 16:53:10,865 - INFO - Finished converting document 4_2023-08-14 in 0.06 sec.
2025-11-14 16:53:10,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\ISRG\4_2023-08-08' --> 'data\processed_data\ISRG\4_2023-08-08.md'
Converted 'data\edgar_documents\ISRG\4_2023-08-11' --> 'data\processed_data\ISRG\4_2023-08-11.md'
Converted 'data\edgar_documents\ISRG\4_2023-08-14' --> 'data\processed_data\ISRG\4_2023-08-14.md'


2025-11-14 16:53:10,907 - INFO - Processing document 4_2023-09-15
2025-11-14 16:53:10,933 - INFO - Finished converting document 4_2023-09-15 in 0.05 sec.
2025-11-14 16:53:10,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:10,995 - INFO - Going to convert document batch...
2025-11-14 16:53:10,996 - INFO - Processing document 4_2023-10-12
2025-11-14 16:53:11,019 - INFO - Finished converting document 4_2023-10-12 in 0.06 sec.
2025-11-14 16:53:11,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:11,091 - INFO - Going to convert document batch...
2025-11-14 16:53:11,092 - INFO - Processing document 4_2023-10-25
2025-11-14 16:53:11,137 - INFO - Finished converting document 4_2023-10-25 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\4_2023-09-15' --> 'data\processed_data\ISRG\4_2023-09-15.md'
Converted 'data\edgar_documents\ISRG\4_2023-10-12' --> 'data\processed_data\ISRG\4_2023-10-12.md'


2025-11-14 16:53:11,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:11,282 - INFO - Going to convert document batch...
2025-11-14 16:53:11,285 - INFO - Processing document 4_2023-10-26
2025-11-14 16:53:11,324 - INFO - Finished converting document 4_2023-10-26 in 0.17 sec.


Converted 'data\edgar_documents\ISRG\4_2023-10-25' --> 'data\processed_data\ISRG\4_2023-10-25.md'


2025-11-14 16:53:11,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:11,398 - INFO - Going to convert document batch...
2025-11-14 16:53:11,399 - INFO - Processing document 4_2023-11-13
2025-11-14 16:53:11,446 - INFO - Finished converting document 4_2023-11-13 in 0.08 sec.
2025-11-14 16:53:11,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2023-10-26' --> 'data\processed_data\ISRG\4_2023-10-26.md'
Converted 'data\edgar_documents\ISRG\4_2023-11-13' --> 'data\processed_data\ISRG\4_2023-11-13.md'


2025-11-14 16:53:11,582 - INFO - Going to convert document batch...
2025-11-14 16:53:11,583 - INFO - Processing document 4_2023-11-15
2025-11-14 16:53:11,646 - INFO - Finished converting document 4_2023-11-15 in 0.16 sec.
2025-11-14 16:53:11,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:11,761 - INFO - Going to convert document batch...
2025-11-14 16:53:11,762 - INFO - Processing document 4_2023-11-17
2025-11-14 16:53:11,788 - INFO - Finished converting document 4_2023-11-17 in 0.05 sec.
2025-11-14 16:53:11,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:11,856 - INFO - Going to convert document batch...
2025-11-14 16:53:11,857 - INFO - Processing document 4_2023-12-14
2025-11-14 16:53:11,892 - INFO - Finished converting document 4_2023-12-14 in 0.08 sec.
2025-11-14 16:53:11,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2023-11-15' --> 'data\processed_data\ISRG\4_2023-11-15.md'
Converted 'data\edgar_documents\ISRG\4_2023-11-17' --> 'data\processed_data\ISRG\4_2023-11-17.md'
Converted 'data\edgar_documents\ISRG\4_2023-12-14' --> 'data\processed_data\ISRG\4_2023-12-14.md'


2025-11-14 16:53:11,946 - INFO - Going to convert document batch...
2025-11-14 16:53:11,947 - INFO - Processing document 4_2024-01-29
2025-11-14 16:53:11,982 - INFO - Finished converting document 4_2024-01-29 in 0.08 sec.
2025-11-14 16:53:12,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,065 - INFO - Going to convert document batch...
2025-11-14 16:53:12,067 - INFO - Processing document 4_2024-01-30
2025-11-14 16:53:12,097 - INFO - Finished converting document 4_2024-01-30 in 0.08 sec.
2025-11-14 16:53:12,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,164 - INFO - Going to convert document batch...
2025-11-14 16:53:12,165 - INFO - Processing document 4_2024-02-05
2025-11-14 16:53:12,191 - INFO - Finished converting document 4_2024-02-05 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2024-01-29' --> 'data\processed_data\ISRG\4_2024-01-29.md'
Converted 'data\edgar_documents\ISRG\4_2024-01-30' --> 'data\processed_data\ISRG\4_2024-01-30.md'
Converted 'data\edgar_documents\ISRG\4_2024-02-05' --> 'data\processed_data\ISRG\4_2024-02-05.md'


2025-11-14 16:53:12,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,283 - INFO - Going to convert document batch...
2025-11-14 16:53:12,284 - INFO - Processing document 4_2024-02-08
2025-11-14 16:53:12,351 - INFO - Finished converting document 4_2024-02-08 in 0.14 sec.
2025-11-14 16:53:12,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,447 - INFO - Going to convert document batch...
2025-11-14 16:53:12,448 - INFO - Processing document 4_2024-02-12
2025-11-14 16:53:12,474 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.
2025-11-14 16:53:12,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,546 - INFO - Going to convert document batch...
2025-11-14 16:53:12,548 - INFO - Processing document 4_2024-02-13
2025-11-14 16:53:12,568 - INFO - Finished converting document 4_2024-02-13 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2024-02-08' --> 'data\processed_data\ISRG\4_2024-02-08.md'
Converted 'data\edgar_documents\ISRG\4_2024-02-12' --> 'data\processed_data\ISRG\4_2024-02-12.md'


2025-11-14 16:53:12,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,616 - INFO - Going to convert document batch...
2025-11-14 16:53:12,617 - INFO - Processing document 4_2024-02-15
2025-11-14 16:53:12,648 - INFO - Finished converting document 4_2024-02-15 in 0.05 sec.
2025-11-14 16:53:12,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,712 - INFO - Going to convert document batch...
2025-11-14 16:53:12,713 - INFO - Processing document 4_2024-02-16
2025-11-14 16:53:12,776 - INFO - Finished converting document 4_2024-02-16 in 0.11 sec.


Converted 'data\edgar_documents\ISRG\4_2024-02-13' --> 'data\processed_data\ISRG\4_2024-02-13.md'
Converted 'data\edgar_documents\ISRG\4_2024-02-15' --> 'data\processed_data\ISRG\4_2024-02-15.md'


2025-11-14 16:53:12,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,848 - INFO - Going to convert document batch...
2025-11-14 16:53:12,849 - INFO - Processing document 4_2024-02-26
2025-11-14 16:53:12,876 - INFO - Finished converting document 4_2024-02-26 in 0.06 sec.
2025-11-14 16:53:12,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:12,937 - INFO - Going to convert document batch...
2025-11-14 16:53:12,938 - INFO - Processing document 4_2024-02-27
2025-11-14 16:53:12,966 - INFO - Finished converting document 4_2024-02-27 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2024-02-16' --> 'data\processed_data\ISRG\4_2024-02-16.md'
Converted 'data\edgar_documents\ISRG\4_2024-02-26' --> 'data\processed_data\ISRG\4_2024-02-26.md'
Converted 'data\edgar_documents\ISRG\4_2024-02-27' --> 'data\processed_data\ISRG\4_2024-02-27.md'


2025-11-14 16:53:13,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,043 - INFO - Going to convert document batch...
2025-11-14 16:53:13,044 - INFO - Processing document 4_2024-02-29
2025-11-14 16:53:13,086 - INFO - Finished converting document 4_2024-02-29 in 0.09 sec.
2025-11-14 16:53:13,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,151 - INFO - Going to convert document batch...
2025-11-14 16:53:13,152 - INFO - Processing document 4_2024-03-01
2025-11-14 16:53:13,173 - INFO - Finished converting document 4_2024-03-01 in 0.06 sec.
2025-11-14 16:53:13,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,247 - INFO - Going to convert document batch...
2025-11-14 16:53:13,248 - INFO - Processing document 4_2024-03-07
2025-11-14 16:53:13,275 - INFO - Finished converting document 4_2024-03-07 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2024-02-29' --> 'data\processed_data\ISRG\4_2024-02-29.md'
Converted 'data\edgar_documents\ISRG\4_2024-03-01' --> 'data\processed_data\ISRG\4_2024-03-01.md'


2025-11-14 16:53:13,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,366 - INFO - Going to convert document batch...
2025-11-14 16:53:13,368 - INFO - Processing document 4_2024-03-11
2025-11-14 16:53:13,473 - INFO - Finished converting document 4_2024-03-11 in 0.17 sec.


Converted 'data\edgar_documents\ISRG\4_2024-03-07' --> 'data\processed_data\ISRG\4_2024-03-07.md'


2025-11-14 16:53:13,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,602 - INFO - Going to convert document batch...
2025-11-14 16:53:13,603 - INFO - Processing document 4_2024-03-18


Converted 'data\edgar_documents\ISRG\4_2024-03-11' --> 'data\processed_data\ISRG\4_2024-03-11.md'


2025-11-14 16:53:13,735 - INFO - Finished converting document 4_2024-03-18 in 0.20 sec.
2025-11-14 16:53:13,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,833 - INFO - Going to convert document batch...
2025-11-14 16:53:13,834 - INFO - Processing document 4_2024-04-24
2025-11-14 16:53:13,863 - INFO - Finished converting document 4_2024-04-24 in 0.05 sec.
2025-11-14 16:53:13,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:13,916 - INFO - Going to convert document batch...
2025-11-14 16:53:13,917 - INFO - Processing document 4_2024-04-26
2025-11-14 16:53:13,944 - INFO - Finished converting document 4_2024-04-26 in 0.06 sec.
2025-11-14 16:53:13,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,002 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ISRG\4_2024-03-18' --> 'data\processed_data\ISRG\4_2024-03-18.md'
Converted 'data\edgar_documents\ISRG\4_2024-04-24' --> 'data\processed_data\ISRG\4_2024-04-24.md'
Converted 'data\edgar_documents\ISRG\4_2024-04-26' --> 'data\processed_data\ISRG\4_2024-04-26.md'


2025-11-14 16:53:14,004 - INFO - Processing document 4_2024-04-29
2025-11-14 16:53:14,039 - INFO - Finished converting document 4_2024-04-29 in 0.06 sec.
2025-11-14 16:53:14,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,127 - INFO - Going to convert document batch...
2025-11-14 16:53:14,128 - INFO - Processing document 4_2024-04-30
2025-11-14 16:53:14,190 - INFO - Finished converting document 4_2024-04-30 in 0.12 sec.


Converted 'data\edgar_documents\ISRG\4_2024-04-29' --> 'data\processed_data\ISRG\4_2024-04-29.md'
Converted 'data\edgar_documents\ISRG\4_2024-04-30' --> 'data\processed_data\ISRG\4_2024-04-30.md'


2025-11-14 16:53:14,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,278 - INFO - Going to convert document batch...
2025-11-14 16:53:14,279 - INFO - Processing document 4_2024-05-06
2025-11-14 16:53:14,404 - INFO - Finished converting document 4_2024-05-06 in 0.17 sec.
2025-11-14 16:53:14,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,506 - INFO - Going to convert document batch...
2025-11-14 16:53:14,507 - INFO - Processing document 4_2024-05-14
2025-11-14 16:53:14,548 - INFO - Finished converting document 4_2024-05-14 in 0.11 sec.
2025-11-14 16:53:14,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,631 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ISRG\4_2024-05-06' --> 'data\processed_data\ISRG\4_2024-05-06.md'
Converted 'data\edgar_documents\ISRG\4_2024-05-14' --> 'data\processed_data\ISRG\4_2024-05-14.md'


2025-11-14 16:53:14,632 - INFO - Processing document 4_2024-05-15
2025-11-14 16:53:14,657 - INFO - Finished converting document 4_2024-05-15 in 0.08 sec.
2025-11-14 16:53:14,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,726 - INFO - Going to convert document batch...
2025-11-14 16:53:14,727 - INFO - Processing document 4_2024-05-17
2025-11-14 16:53:14,757 - INFO - Finished converting document 4_2024-05-17 in 0.06 sec.
2025-11-14 16:53:14,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:14,840 - INFO - Going to convert document batch...
2025-11-14 16:53:14,842 - INFO - Processing document 4_2024-05-30
2025-11-14 16:53:14,881 - INFO - Finished converting document 4_2024-05-30 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\4_2024-05-15' --> 'data\processed_data\ISRG\4_2024-05-15.md'
Converted 'data\edgar_documents\ISRG\4_2024-05-17' --> 'data\processed_data\ISRG\4_2024-05-17.md'


2025-11-14 16:53:14,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2024-05-30' --> 'data\processed_data\ISRG\4_2024-05-30.md'


2025-11-14 16:53:15,312 - INFO - Going to convert document batch...
2025-11-14 16:53:15,313 - INFO - Processing document 4_2024-06-03
2025-11-14 16:53:15,372 - INFO - Finished converting document 4_2024-06-03 in 0.47 sec.
2025-11-14 16:53:15,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:15,477 - INFO - Going to convert document batch...
2025-11-14 16:53:15,479 - INFO - Processing document 4_2024-06-06
2025-11-14 16:53:15,510 - INFO - Finished converting document 4_2024-06-06 in 0.09 sec.
2025-11-14 16:53:15,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:15,576 - INFO - Going to convert document batch...
2025-11-14 16:53:15,577 - INFO - Processing document 4_2024-06-10
2025-11-14 16:53:15,605 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\4_2024-06-03' --> 'data\processed_data\ISRG\4_2024-06-03.md'
Converted 'data\edgar_documents\ISRG\4_2024-06-06' --> 'data\processed_data\ISRG\4_2024-06-06.md'


2025-11-14 16:53:15,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:15,675 - INFO - Going to convert document batch...
2025-11-14 16:53:15,676 - INFO - Processing document 4_2024-06-11
2025-11-14 16:53:15,721 - INFO - Finished converting document 4_2024-06-11 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\4_2024-06-10' --> 'data\processed_data\ISRG\4_2024-06-10.md'
Converted 'data\edgar_documents\ISRG\4_2024-06-11' --> 'data\processed_data\ISRG\4_2024-06-11.md'


2025-11-14 16:53:15,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:15,886 - INFO - Going to convert document batch...
2025-11-14 16:53:15,887 - INFO - Processing document 4_2024-06-12
2025-11-14 16:53:15,917 - INFO - Finished converting document 4_2024-06-12 in 0.17 sec.
2025-11-14 16:53:15,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:15,988 - INFO - Going to convert document batch...
2025-11-14 16:53:15,988 - INFO - Processing document 4_2024-07-24
2025-11-14 16:53:16,015 - INFO - Finished converting document 4_2024-07-24 in 0.06 sec.
2025-11-14 16:53:16,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,089 - INFO - Going to convert document batch...
2025-11-14 16:53:16,089 - INFO - Processing document 4_2024-07-30


Converted 'data\edgar_documents\ISRG\4_2024-06-12' --> 'data\processed_data\ISRG\4_2024-06-12.md'
Converted 'data\edgar_documents\ISRG\4_2024-07-24' --> 'data\processed_data\ISRG\4_2024-07-24.md'


2025-11-14 16:53:16,159 - INFO - Finished converting document 4_2024-07-30 in 0.11 sec.
2025-11-14 16:53:16,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,395 - INFO - Going to convert document batch...
2025-11-14 16:53:16,397 - INFO - Processing document 4_2024-07-31
2025-11-14 16:53:16,430 - INFO - Finished converting document 4_2024-07-31 in 0.11 sec.
2025-11-14 16:53:16,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,490 - INFO - Going to convert document batch...
2025-11-14 16:53:16,490 - INFO - Processing document 4_2024-08-05


Converted 'data\edgar_documents\ISRG\4_2024-07-30' --> 'data\processed_data\ISRG\4_2024-07-30.md'
Converted 'data\edgar_documents\ISRG\4_2024-07-31' --> 'data\processed_data\ISRG\4_2024-07-31.md'


2025-11-14 16:53:16,522 - INFO - Finished converting document 4_2024-08-05 in 0.06 sec.
2025-11-14 16:53:16,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,592 - INFO - Going to convert document batch...
2025-11-14 16:53:16,593 - INFO - Processing document 4_2024-08-13
2025-11-14 16:53:16,640 - INFO - Finished converting document 4_2024-08-13 in 0.09 sec.
2025-11-14 16:53:16,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,705 - INFO - Going to convert document batch...
2025-11-14 16:53:16,706 - INFO - Processing document 4_2024-08-26


Converted 'data\edgar_documents\ISRG\4_2024-08-05' --> 'data\processed_data\ISRG\4_2024-08-05.md'
Converted 'data\edgar_documents\ISRG\4_2024-08-13' --> 'data\processed_data\ISRG\4_2024-08-13.md'


2025-11-14 16:53:16,737 - INFO - Finished converting document 4_2024-08-26 in 0.06 sec.
2025-11-14 16:53:16,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:16,813 - INFO - Going to convert document batch...
2025-11-14 16:53:16,814 - INFO - Processing document 4_2024-08-29
2025-11-14 16:53:16,889 - INFO - Finished converting document 4_2024-08-29 in 0.12 sec.
2025-11-14 16:53:16,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2024-08-26' --> 'data\processed_data\ISRG\4_2024-08-26.md'
Converted 'data\edgar_documents\ISRG\4_2024-08-29' --> 'data\processed_data\ISRG\4_2024-08-29.md'


2025-11-14 16:53:16,990 - INFO - Going to convert document batch...
2025-11-14 16:53:16,991 - INFO - Processing document 4_2024-09-03
2025-11-14 16:53:17,028 - INFO - Finished converting document 4_2024-09-03 in 0.09 sec.
2025-11-14 16:53:17,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,092 - INFO - Going to convert document batch...
2025-11-14 16:53:17,093 - INFO - Processing document 4_2024-09-09
2025-11-14 16:53:17,116 - INFO - Finished converting document 4_2024-09-09 in 0.06 sec.
2025-11-14 16:53:17,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,161 - INFO - Going to convert document batch...
2025-11-14 16:53:17,162 - INFO - Processing document 4_2024-09-10
2025-11-14 16:53:17,192 - INFO - Finished converting document 4_2024-09-10 in 0.05 sec.
2025-11-14 16:53:17,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2024-09-03' --> 'data\processed_data\ISRG\4_2024-09-03.md'
Converted 'data\edgar_documents\ISRG\4_2024-09-09' --> 'data\processed_data\ISRG\4_2024-09-09.md'
Converted 'data\edgar_documents\ISRG\4_2024-09-10' --> 'data\processed_data\ISRG\4_2024-09-10.md'


2025-11-14 16:53:17,257 - INFO - Going to convert document batch...
2025-11-14 16:53:17,258 - INFO - Processing document 4_2024-09-16
2025-11-14 16:53:17,278 - INFO - Finished converting document 4_2024-09-16 in 0.06 sec.
2025-11-14 16:53:17,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,342 - INFO - Going to convert document batch...
2025-11-14 16:53:17,343 - INFO - Processing document 4_2024-10-10
2025-11-14 16:53:17,365 - INFO - Finished converting document 4_2024-10-10 in 0.06 sec.
2025-11-14 16:53:17,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,421 - INFO - Going to convert document batch...
2025-11-14 16:53:17,421 - INFO - Processing document 4_2024-10-23
2025-11-14 16:53:17,443 - INFO - Finished converting document 4_2024-10-23 in 0.05 sec.
2025-11-14 16:53:17,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2024-09-16' --> 'data\processed_data\ISRG\4_2024-09-16.md'
Converted 'data\edgar_documents\ISRG\4_2024-10-10' --> 'data\processed_data\ISRG\4_2024-10-10.md'
Converted 'data\edgar_documents\ISRG\4_2024-10-23' --> 'data\processed_data\ISRG\4_2024-10-23.md'


2025-11-14 16:53:17,524 - INFO - Going to convert document batch...
2025-11-14 16:53:17,524 - INFO - Processing document 4_2024-10-24
2025-11-14 16:53:17,568 - INFO - Finished converting document 4_2024-10-24 in 0.09 sec.
2025-11-14 16:53:17,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,653 - INFO - Going to convert document batch...
2025-11-14 16:53:17,655 - INFO - Processing document 4_2024-10-28
2025-11-14 16:53:17,678 - INFO - Finished converting document 4_2024-10-28 in 0.08 sec.
2025-11-14 16:53:17,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:17,772 - INFO - Going to convert document batch...
2025-11-14 16:53:17,773 - INFO - Processing document 4_2024-10-29


Converted 'data\edgar_documents\ISRG\4_2024-10-24' --> 'data\processed_data\ISRG\4_2024-10-24.md'
Converted 'data\edgar_documents\ISRG\4_2024-10-28' --> 'data\processed_data\ISRG\4_2024-10-28.md'


2025-11-14 16:53:17,926 - INFO - Finished converting document 4_2024-10-29 in 0.16 sec.
2025-11-14 16:53:18,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,065 - INFO - Going to convert document batch...
2025-11-14 16:53:18,065 - INFO - Processing document 4_2024-10-31
2025-11-14 16:53:18,094 - INFO - Finished converting document 4_2024-10-31 in 0.09 sec.
2025-11-14 16:53:18,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,180 - INFO - Going to convert document batch...
2025-11-14 16:53:18,182 - INFO - Processing document 4_2024-11-05


Converted 'data\edgar_documents\ISRG\4_2024-10-29' --> 'data\processed_data\ISRG\4_2024-10-29.md'
Converted 'data\edgar_documents\ISRG\4_2024-10-31' --> 'data\processed_data\ISRG\4_2024-10-31.md'


2025-11-14 16:53:18,209 - INFO - Finished converting document 4_2024-11-05 in 0.08 sec.
2025-11-14 16:53:18,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,378 - INFO - Going to convert document batch...
2025-11-14 16:53:18,379 - INFO - Processing document 4_2024-11-12


Converted 'data\edgar_documents\ISRG\4_2024-11-05' --> 'data\processed_data\ISRG\4_2024-11-05.md'


2025-11-14 16:53:18,459 - INFO - Finished converting document 4_2024-11-12 in 0.22 sec.
2025-11-14 16:53:18,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,598 - INFO - Going to convert document batch...
2025-11-14 16:53:18,599 - INFO - Processing document 4_2024-11-13
2025-11-14 16:53:18,643 - INFO - Finished converting document 4_2024-11-13 in 0.11 sec.


Converted 'data\edgar_documents\ISRG\4_2024-11-12' --> 'data\processed_data\ISRG\4_2024-11-12.md'
Converted 'data\edgar_documents\ISRG\4_2024-11-13' --> 'data\processed_data\ISRG\4_2024-11-13.md'


2025-11-14 16:53:18,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,760 - INFO - Going to convert document batch...
2025-11-14 16:53:18,762 - INFO - Processing document 4_2024-11-22
2025-11-14 16:53:18,797 - INFO - Finished converting document 4_2024-11-22 in 0.12 sec.
2025-11-14 16:53:18,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,880 - INFO - Going to convert document batch...
2025-11-14 16:53:18,881 - INFO - Processing document 4_2024-11-26
2025-11-14 16:53:18,912 - INFO - Finished converting document 4_2024-11-26 in 0.09 sec.
2025-11-14 16:53:18,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:18,985 - INFO - Going to convert document batch...
2025-11-14 16:53:18,987 - INFO - Processing document 4_2024-12-02


Converted 'data\edgar_documents\ISRG\4_2024-11-22' --> 'data\processed_data\ISRG\4_2024-11-22.md'
Converted 'data\edgar_documents\ISRG\4_2024-11-26' --> 'data\processed_data\ISRG\4_2024-11-26.md'


2025-11-14 16:53:19,031 - INFO - Finished converting document 4_2024-12-02 in 0.08 sec.
2025-11-14 16:53:19,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,098 - INFO - Going to convert document batch...
2025-11-14 16:53:19,099 - INFO - Processing document 4_2024-12-11
2025-11-14 16:53:19,238 - INFO - Finished converting document 4_2024-12-11 in 0.17 sec.


Converted 'data\edgar_documents\ISRG\4_2024-12-02' --> 'data\processed_data\ISRG\4_2024-12-02.md'
Converted 'data\edgar_documents\ISRG\4_2024-12-11' --> 'data\processed_data\ISRG\4_2024-12-11.md'


2025-11-14 16:53:19,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,332 - INFO - Going to convert document batch...
2025-11-14 16:53:19,333 - INFO - Processing document 4_2025-01-28
2025-11-14 16:53:19,363 - INFO - Finished converting document 4_2025-01-28 in 0.09 sec.
2025-11-14 16:53:19,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,444 - INFO - Going to convert document batch...
2025-11-14 16:53:19,445 - INFO - Processing document 4_2025-01-29
2025-11-14 16:53:19,509 - INFO - Finished converting document 4_2025-01-29 in 0.11 sec.


Converted 'data\edgar_documents\ISRG\4_2025-01-28' --> 'data\processed_data\ISRG\4_2025-01-28.md'
Converted 'data\edgar_documents\ISRG\4_2025-01-29' --> 'data\processed_data\ISRG\4_2025-01-29.md'


2025-11-14 16:53:19,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,629 - INFO - Going to convert document batch...
2025-11-14 16:53:19,629 - INFO - Processing document 4_2025-02-10
2025-11-14 16:53:19,748 - INFO - Finished converting document 4_2025-02-10 in 0.19 sec.
2025-11-14 16:53:19,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,817 - INFO - Going to convert document batch...
2025-11-14 16:53:19,818 - INFO - Processing document 4_2025-02-11
2025-11-14 16:53:19,851 - INFO - Finished converting document 4_2025-02-11 in 0.06 sec.
2025-11-14 16:53:19,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:19,915 - INFO - Going to convert document batch...
2025-11-14 16:53:19,916 - INFO - Processing document 4_2025-02-12
2025-11-14 16:53:19,943 - INFO - Finished converting document 4_2025-02-12 in 0.06 sec.
2025-11-14 16:53:19,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2025-02-10' --> 'data\processed_data\ISRG\4_2025-02-10.md'
Converted 'data\edgar_documents\ISRG\4_2025-02-11' --> 'data\processed_data\ISRG\4_2025-02-11.md'
Converted 'data\edgar_documents\ISRG\4_2025-02-12' --> 'data\processed_data\ISRG\4_2025-02-12.md'


2025-11-14 16:53:20,021 - INFO - Going to convert document batch...
2025-11-14 16:53:20,023 - INFO - Processing document 4_2025-02-26
2025-11-14 16:53:20,076 - INFO - Finished converting document 4_2025-02-26 in 0.11 sec.
2025-11-14 16:53:20,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,151 - INFO - Going to convert document batch...
2025-11-14 16:53:20,152 - INFO - Processing document 4_2025-02-27
2025-11-14 16:53:20,182 - INFO - Finished converting document 4_2025-02-27 in 0.06 sec.
2025-11-14 16:53:20,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,248 - INFO - Going to convert document batch...
2025-11-14 16:53:20,250 - INFO - Processing document 4_2025-02-28


Converted 'data\edgar_documents\ISRG\4_2025-02-26' --> 'data\processed_data\ISRG\4_2025-02-26.md'
Converted 'data\edgar_documents\ISRG\4_2025-02-27' --> 'data\processed_data\ISRG\4_2025-02-27.md'


2025-11-14 16:53:20,587 - INFO - Finished converting document 4_2025-02-28 in 0.38 sec.
2025-11-14 16:53:20,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,665 - INFO - Going to convert document batch...
2025-11-14 16:53:20,665 - INFO - Processing document 4_2025-03-03
2025-11-14 16:53:20,699 - INFO - Finished converting document 4_2025-03-03 in 0.09 sec.
2025-11-14 16:53:20,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,759 - INFO - Going to convert document batch...
2025-11-14 16:53:20,760 - INFO - Processing document 4_2025-03-06
2025-11-14 16:53:20,783 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\4_2025-02-28' --> 'data\processed_data\ISRG\4_2025-02-28.md'
Converted 'data\edgar_documents\ISRG\4_2025-03-03' --> 'data\processed_data\ISRG\4_2025-03-03.md'
Converted 'data\edgar_documents\ISRG\4_2025-03-06' --> 'data\processed_data\ISRG\4_2025-03-06.md'


2025-11-14 16:53:20,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,841 - INFO - Going to convert document batch...
2025-11-14 16:53:20,842 - INFO - Processing document 4_2025-03-07
2025-11-14 16:53:20,863 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 16:53:20,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:20,932 - INFO - Going to convert document batch...
2025-11-14 16:53:20,933 - INFO - Processing document 4_2025-03-12
2025-11-14 16:53:20,971 - INFO - Finished converting document 4_2025-03-12 in 0.08 sec.
2025-11-14 16:53:21,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,073 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ISRG\4_2025-03-07' --> 'data\processed_data\ISRG\4_2025-03-07.md'
Converted 'data\edgar_documents\ISRG\4_2025-03-12' --> 'data\processed_data\ISRG\4_2025-03-12.md'


2025-11-14 16:53:21,074 - INFO - Processing document 4_2025-03-14
2025-11-14 16:53:21,139 - INFO - Finished converting document 4_2025-03-14 in 0.14 sec.
2025-11-14 16:53:21,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,222 - INFO - Going to convert document batch...
2025-11-14 16:53:21,223 - INFO - Processing document 4_2025-04-25
2025-11-14 16:53:21,247 - INFO - Finished converting document 4_2025-04-25 in 0.06 sec.
2025-11-14 16:53:21,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,300 - INFO - Going to convert document batch...
2025-11-14 16:53:21,301 - INFO - Processing document 4_2025-04-28
2025-11-14 16:53:21,324 - INFO - Finished converting document 4_2025-04-28 in 0.06 sec.
2025-11-14 16:53:21,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2025-03-14' --> 'data\processed_data\ISRG\4_2025-03-14.md'
Converted 'data\edgar_documents\ISRG\4_2025-04-25' --> 'data\processed_data\ISRG\4_2025-04-25.md'
Converted 'data\edgar_documents\ISRG\4_2025-04-28' --> 'data\processed_data\ISRG\4_2025-04-28.md'


2025-11-14 16:53:21,413 - INFO - Going to convert document batch...
2025-11-14 16:53:21,414 - INFO - Processing document 4_2025-04-29
2025-11-14 16:53:21,478 - INFO - Finished converting document 4_2025-04-29 in 0.12 sec.
2025-11-14 16:53:21,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,687 - INFO - Going to convert document batch...
2025-11-14 16:53:21,688 - INFO - Processing document 4_2025-05-01
2025-11-14 16:53:21,713 - INFO - Finished converting document 4_2025-05-01 in 0.06 sec.
2025-11-14 16:53:21,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,779 - INFO - Going to convert document batch...
2025-11-14 16:53:21,780 - INFO - Processing document 4_2025-05-05
2025-11-14 16:53:21,824 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\4_2025-04-29' --> 'data\processed_data\ISRG\4_2025-04-29.md'
Converted 'data\edgar_documents\ISRG\4_2025-05-01' --> 'data\processed_data\ISRG\4_2025-05-01.md'
Converted 'data\edgar_documents\ISRG\4_2025-05-05' --> 'data\processed_data\ISRG\4_2025-05-05.md'


2025-11-14 16:53:21,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:21,922 - INFO - Going to convert document batch...
2025-11-14 16:53:21,924 - INFO - Processing document 4_2025-05-14
2025-11-14 16:53:21,951 - INFO - Finished converting document 4_2025-05-14 in 0.09 sec.
2025-11-14 16:53:21,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,007 - INFO - Going to convert document batch...
2025-11-14 16:53:22,008 - INFO - Processing document 4_2025-05-16
2025-11-14 16:53:22,031 - INFO - Finished converting document 4_2025-05-16 in 0.06 sec.
2025-11-14 16:53:22,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,088 - INFO - Going to convert document batch...
2025-11-14 16:53:22,089 - INFO - Processing document 4_2025-06-04
2025-11-14 16:53:22,109 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 16:53:22,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\4_2025-05-14' --> 'data\processed_data\ISRG\4_2025-05-14.md'
Converted 'data\edgar_documents\ISRG\4_2025-05-16' --> 'data\processed_data\ISRG\4_2025-05-16.md'
Converted 'data\edgar_documents\ISRG\4_2025-06-04' --> 'data\processed_data\ISRG\4_2025-06-04.md'


2025-11-14 16:53:22,167 - INFO - Going to convert document batch...
2025-11-14 16:53:22,168 - INFO - Processing document 4_2025-06-06
2025-11-14 16:53:22,279 - INFO - Finished converting document 4_2025-06-06 in 0.16 sec.
2025-11-14 16:53:22,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,383 - INFO - Going to convert document batch...
2025-11-14 16:53:22,385 - INFO - Processing document 4_2025-06-10
2025-11-14 16:53:22,412 - INFO - Finished converting document 4_2025-06-10 in 0.09 sec.
2025-11-14 16:53:22,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,486 - INFO - Going to convert document batch...
2025-11-14 16:53:22,489 - INFO - Processing document 4_2025-07-11


Converted 'data\edgar_documents\ISRG\4_2025-06-06' --> 'data\processed_data\ISRG\4_2025-06-06.md'
Converted 'data\edgar_documents\ISRG\4_2025-06-10' --> 'data\processed_data\ISRG\4_2025-06-10.md'


2025-11-14 16:53:22,521 - INFO - Finished converting document 4_2025-07-11 in 0.08 sec.
2025-11-14 16:53:22,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,597 - INFO - Going to convert document batch...
2025-11-14 16:53:22,598 - INFO - Processing document 4_2025-07-25
2025-11-14 16:53:22,621 - INFO - Finished converting document 4_2025-07-25 in 0.08 sec.
2025-11-14 16:53:22,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,683 - INFO - Going to convert document batch...
2025-11-14 16:53:22,685 - INFO - Processing document 4_2025-07-29
2025-11-14 16:53:22,714 - INFO - Finished converting document 4_2025-07-29 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\4_2025-07-11' --> 'data\processed_data\ISRG\4_2025-07-11.md'
Converted 'data\edgar_documents\ISRG\4_2025-07-25' --> 'data\processed_data\ISRG\4_2025-07-25.md'


2025-11-14 16:53:22,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,776 - INFO - Going to convert document batch...
2025-11-14 16:53:22,777 - INFO - Processing document 4_2025-09-02
2025-11-14 16:53:22,806 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 16:53:22,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:22,893 - INFO - Going to convert document batch...
2025-11-14 16:53:22,895 - INFO - Processing document 4_2025-09-04
2025-11-14 16:53:22,931 - INFO - Finished converting document 4_2025-09-04 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\4_2025-07-29' --> 'data\processed_data\ISRG\4_2025-07-29.md'
Converted 'data\edgar_documents\ISRG\4_2025-09-02' --> 'data\processed_data\ISRG\4_2025-09-02.md'


2025-11-14 16:53:23,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,096 - INFO - Going to convert document batch...
2025-11-14 16:53:23,098 - INFO - Processing document 4_2025-10-10
2025-11-14 16:53:23,124 - INFO - Finished converting document 4_2025-10-10 in 0.17 sec.


Converted 'data\edgar_documents\ISRG\4_2025-09-04' --> 'data\processed_data\ISRG\4_2025-09-04.md'


2025-11-14 16:53:23,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,185 - INFO - Going to convert document batch...
2025-11-14 16:53:23,186 - INFO - Processing document 4_2025-10-27
2025-11-14 16:53:23,212 - INFO - Finished converting document 4_2025-10-27 in 0.05 sec.
2025-11-14 16:53:23,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,300 - INFO - Going to convert document batch...
2025-11-14 16:53:23,302 - INFO - Processing document 4_2025-10-29
2025-11-14 16:53:23,346 - INFO - Finished converting document 4_2025-10-29 in 0.11 sec.


Converted 'data\edgar_documents\ISRG\4_2025-10-10' --> 'data\processed_data\ISRG\4_2025-10-10.md'
Converted 'data\edgar_documents\ISRG\4_2025-10-27' --> 'data\processed_data\ISRG\4_2025-10-27.md'


2025-11-14 16:53:23,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,522 - INFO - Going to convert document batch...
2025-11-14 16:53:23,523 - INFO - Processing document 4_2025-11-03
2025-11-14 16:53:23,562 - INFO - Finished converting document 4_2025-11-03 in 0.17 sec.


Converted 'data\edgar_documents\ISRG\4_2025-10-29' --> 'data\processed_data\ISRG\4_2025-10-29.md'


2025-11-14 16:53:23,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,647 - INFO - Going to convert document batch...
2025-11-14 16:53:23,648 - INFO - Processing document 4_2025-11-06
2025-11-14 16:53:23,688 - INFO - Finished converting document 4_2025-11-06 in 0.11 sec.
2025-11-14 16:53:23,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,768 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ISRG\4_2025-11-03' --> 'data\processed_data\ISRG\4_2025-11-03.md'
Converted 'data\edgar_documents\ISRG\4_2025-11-06' --> 'data\processed_data\ISRG\4_2025-11-06.md'


2025-11-14 16:53:23,769 - INFO - Processing document 8-K_2023-01-11
2025-11-14 16:53:23,885 - INFO - Finished converting document 8-K_2023-01-11 in 0.16 sec.
2025-11-14 16:53:23,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:23,952 - INFO - Going to convert document batch...
2025-11-14 16:53:23,953 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:53:23,978 - INFO - Finished converting document 8-K_2023-01-24 in 0.05 sec.
2025-11-14 16:53:24,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,033 - INFO - Going to convert document batch...
2025-11-14 16:53:24,033 - INFO - Processing document 8-K_2023-04-18
2025-11-14 16:53:24,062 - INFO - Finished converting document 8-K_2023-04-18 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\8-K_2023-01-11' --> 'data\processed_data\ISRG\8-K_2023-01-11.md'
Converted 'data\edgar_documents\ISRG\8-K_2023-01-24' --> 'data\processed_data\ISRG\8-K_2023-01-24.md'
Converted 'data\edgar_documents\ISRG\8-K_2023-04-18' --> 'data\processed_data\ISRG\8-K_2023-04-18.md'


2025-11-14 16:53:24,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,141 - INFO - Going to convert document batch...
2025-11-14 16:53:24,141 - INFO - Processing document 8-K_2023-05-02
2025-11-14 16:53:24,199 - INFO - Finished converting document 8-K_2023-05-02 in 0.12 sec.
2025-11-14 16:53:24,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,283 - INFO - Going to convert document batch...
2025-11-14 16:53:24,284 - INFO - Processing document 8-K_2023-05-16
2025-11-14 16:53:24,308 - INFO - Finished converting document 8-K_2023-05-16 in 0.09 sec.
2025-11-14 16:53:24,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,372 - INFO - Going to convert document batch...
2025-11-14 16:53:24,373 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:53:24,404 - INFO - Finished converting document 8-K_2023-07-20 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\8-K_2023-05-02' --> 'data\processed_data\ISRG\8-K_2023-05-02.md'
Converted 'data\edgar_documents\ISRG\8-K_2023-05-16' --> 'data\processed_data\ISRG\8-K_2023-05-16.md'


2025-11-14 16:53:24,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,462 - INFO - Going to convert document batch...
2025-11-14 16:53:24,463 - INFO - Processing document 8-K_2023-10-19
2025-11-14 16:53:24,496 - INFO - Finished converting document 8-K_2023-10-19 in 0.08 sec.
2025-11-14 16:53:24,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,558 - INFO - Going to convert document batch...
2025-11-14 16:53:24,559 - INFO - Processing document 8-K_2023-10-31
2025-11-14 16:53:24,586 - INFO - Finished converting document 8-K_2023-10-31 in 0.06 sec.
2025-11-14 16:53:24,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\8-K_2023-07-20' --> 'data\processed_data\ISRG\8-K_2023-07-20.md'
Converted 'data\edgar_documents\ISRG\8-K_2023-10-19' --> 'data\processed_data\ISRG\8-K_2023-10-19.md'
Converted 'data\edgar_documents\ISRG\8-K_2023-10-31' --> 'data\processed_data\ISRG\8-K_2023-10-31.md'


2025-11-14 16:53:24,653 - INFO - Going to convert document batch...
2025-11-14 16:53:24,654 - INFO - Processing document 8-K_2024-01-09
2025-11-14 16:53:24,699 - INFO - Finished converting document 8-K_2024-01-09 in 0.11 sec.
2025-11-14 16:53:24,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,756 - INFO - Going to convert document batch...
2025-11-14 16:53:24,761 - INFO - Processing document 8-K_2024-01-23
2025-11-14 16:53:24,807 - INFO - Finished converting document 8-K_2024-01-23 in 0.09 sec.
2025-11-14 16:53:24,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,871 - INFO - Going to convert document batch...
2025-11-14 16:53:24,872 - INFO - Processing document 8-K_2024-03-14
2025-11-14 16:53:24,893 - INFO - Finished converting document 8-K_2024-03-14 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\8-K_2024-01-09' --> 'data\processed_data\ISRG\8-K_2024-01-09.md'
Converted 'data\edgar_documents\ISRG\8-K_2024-01-23' --> 'data\processed_data\ISRG\8-K_2024-01-23.md'


2025-11-14 16:53:24,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:24,941 - INFO - Going to convert document batch...
2025-11-14 16:53:24,942 - INFO - Processing document 8-K_2024-04-18
2025-11-14 16:53:24,990 - INFO - Finished converting document 8-K_2024-04-18 in 0.08 sec.
2025-11-14 16:53:25,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,050 - INFO - Going to convert document batch...
2025-11-14 16:53:25,051 - INFO - Processing document 8-K_2024-04-30
2025-11-14 16:53:25,093 - INFO - Finished converting document 8-K_2024-04-30 in 0.09 sec.


Converted 'data\edgar_documents\ISRG\8-K_2024-03-14' --> 'data\processed_data\ISRG\8-K_2024-03-14.md'
Converted 'data\edgar_documents\ISRG\8-K_2024-04-18' --> 'data\processed_data\ISRG\8-K_2024-04-18.md'


2025-11-14 16:53:25,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,150 - INFO - Going to convert document batch...
2025-11-14 16:53:25,151 - INFO - Processing document 8-K_2024-07-18
2025-11-14 16:53:25,184 - INFO - Finished converting document 8-K_2024-07-18 in 0.08 sec.
2025-11-14 16:53:25,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\8-K_2024-04-30' --> 'data\processed_data\ISRG\8-K_2024-04-30.md'
Converted 'data\edgar_documents\ISRG\8-K_2024-07-18' --> 'data\processed_data\ISRG\8-K_2024-07-18.md'


2025-11-14 16:53:25,318 - INFO - Going to convert document batch...
2025-11-14 16:53:25,325 - INFO - Processing document 8-K_2024-07-25
2025-11-14 16:53:25,353 - INFO - Finished converting document 8-K_2024-07-25 in 0.14 sec.
2025-11-14 16:53:25,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,425 - INFO - Going to convert document batch...
2025-11-14 16:53:25,425 - INFO - Processing document 8-K_2024-10-17
2025-11-14 16:53:25,450 - INFO - Finished converting document 8-K_2024-10-17 in 0.09 sec.
2025-11-14 16:53:25,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,517 - INFO - Going to convert document batch...
2025-11-14 16:53:25,518 - INFO - Processing document 8-K_2025-01-06
2025-11-14 16:53:25,541 - INFO - Finished converting document 8-K_2025-01-06 in 0.08 sec.


Converted 'data\edgar_documents\ISRG\8-K_2024-07-25' --> 'data\processed_data\ISRG\8-K_2024-07-25.md'
Converted 'data\edgar_documents\ISRG\8-K_2024-10-17' --> 'data\processed_data\ISRG\8-K_2024-10-17.md'


2025-11-14 16:53:25,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,592 - INFO - Going to convert document batch...
2025-11-14 16:53:25,593 - INFO - Processing document 8-K_2025-01-15
2025-11-14 16:53:25,626 - INFO - Finished converting document 8-K_2025-01-15 in 0.08 sec.
2025-11-14 16:53:25,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,686 - INFO - Going to convert document batch...
2025-11-14 16:53:25,687 - INFO - Processing document 8-K_2025-01-23
2025-11-14 16:53:25,718 - INFO - Finished converting document 8-K_2025-01-23 in 0.06 sec.


Converted 'data\edgar_documents\ISRG\8-K_2025-01-06' --> 'data\processed_data\ISRG\8-K_2025-01-06.md'
Converted 'data\edgar_documents\ISRG\8-K_2025-01-15' --> 'data\processed_data\ISRG\8-K_2025-01-15.md'


2025-11-14 16:53:25,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:25,898 - INFO - Going to convert document batch...
2025-11-14 16:53:25,899 - INFO - Processing document 8-K_2025-04-22


Converted 'data\edgar_documents\ISRG\8-K_2025-01-23' --> 'data\processed_data\ISRG\8-K_2025-01-23.md'


2025-11-14 16:53:26,211 - INFO - Finished converting document 8-K_2025-04-22 in 0.38 sec.
2025-11-14 16:53:26,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:26,378 - INFO - Going to convert document batch...
2025-11-14 16:53:26,379 - INFO - Processing document 8-K_2025-05-05
2025-11-14 16:53:26,426 - INFO - Finished converting document 8-K_2025-05-05 in 0.19 sec.


Converted 'data\edgar_documents\ISRG\8-K_2025-04-22' --> 'data\processed_data\ISRG\8-K_2025-04-22.md'
Converted 'data\edgar_documents\ISRG\8-K_2025-05-05' --> 'data\processed_data\ISRG\8-K_2025-05-05.md'


2025-11-14 16:53:26,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:26,728 - INFO - Going to convert document batch...
2025-11-14 16:53:26,729 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:53:26,754 - INFO - Finished converting document 8-K_2025-05-15 in 0.30 sec.
2025-11-14 16:53:26,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:53:26,821 - INFO - Going to convert document batch...
2025-11-14 16:53:26,822 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:53:26,854 - INFO - Finished converting document 8-K_2025-07-22 in 0.09 sec.
2025-11-14 16:53:26,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\8-K_2025-05-15' --> 'data\processed_data\ISRG\8-K_2025-05-15.md'
Converted 'data\edgar_documents\ISRG\8-K_2025-07-22' --> 'data\processed_data\ISRG\8-K_2025-07-22.md'


2025-11-14 16:53:27,329 - INFO - Going to convert document batch...
2025-11-14 16:53:27,330 - INFO - Processing document DEF-14A_2023-03-10
2025-11-14 16:53:28,079 - INFO - Finished converting document DEF-14A_2023-03-10 in 1.22 sec.
2025-11-14 16:53:28,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\DEF-14A_2023-03-10' --> 'data\processed_data\ISRG\DEF-14A_2023-03-10.md'


2025-11-14 16:53:29,309 - INFO - Going to convert document batch...
2025-11-14 16:53:29,310 - INFO - Processing document DEF-14A_2024-03-08
2025-11-14 16:53:30,216 - INFO - Finished converting document DEF-14A_2024-03-08 in 1.64 sec.
2025-11-14 16:53:30,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\DEF-14A_2024-03-08' --> 'data\processed_data\ISRG\DEF-14A_2024-03-08.md'


2025-11-14 16:53:31,245 - INFO - Going to convert document batch...
2025-11-14 16:53:31,246 - INFO - Processing document DEF-14A_2025-03-14
2025-11-14 16:53:32,234 - INFO - Finished converting document DEF-14A_2025-03-14 in 1.44 sec.
2025-11-14 16:53:33,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ISRG\DEF-14A_2025-03-14' --> 'data\processed_data\ISRG\DEF-14A_2025-03-14.md'
Processed 150 new files. Errors: 0
Found 130 files to process in data\edgar_documents\JNJ


2025-11-14 16:53:35,148 - INFO - Going to convert document batch...
2025-11-14 16:53:35,149 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:53:35,149 - INFO - Processing document 10-K_2023-02-16
2025-11-14 16:53:38,218 - INFO - Finished converting document 10-K_2023-02-16 in 5.22 sec.
2025-11-14 16:53:39,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-K_2023-02-16' --> 'data\processed_data\JNJ\10-K_2023-02-16.md'


2025-11-14 16:53:41,038 - INFO - Going to convert document batch...
2025-11-14 16:53:41,040 - INFO - Processing document 10-K_2024-02-16
2025-11-14 16:53:44,055 - INFO - Finished converting document 10-K_2024-02-16 in 4.86 sec.
2025-11-14 16:53:45,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-K_2024-02-16' --> 'data\processed_data\JNJ\10-K_2024-02-16.md'


2025-11-14 16:53:47,068 - INFO - Going to convert document batch...
2025-11-14 16:53:47,069 - INFO - Processing document 10-K_2025-02-13
2025-11-14 16:53:50,531 - INFO - Finished converting document 10-K_2025-02-13 in 5.53 sec.
2025-11-14 16:53:51,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-K_2025-02-13' --> 'data\processed_data\JNJ\10-K_2025-02-13.md'


2025-11-14 16:53:53,046 - INFO - Going to convert document batch...
2025-11-14 16:53:53,047 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 16:53:54,255 - INFO - Finished converting document 10-Q_2023-04-28 in 2.72 sec.
2025-11-14 16:53:55,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2023-04-28' --> 'data\processed_data\JNJ\10-Q_2023-04-28.md'


2025-11-14 16:53:56,884 - INFO - Going to convert document batch...
2025-11-14 16:53:56,884 - INFO - Processing document 10-Q_2023-07-31
2025-11-14 16:53:58,628 - INFO - Finished converting document 10-Q_2023-07-31 in 3.56 sec.
2025-11-14 16:53:59,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2023-07-31' --> 'data\processed_data\JNJ\10-Q_2023-07-31.md'


2025-11-14 16:54:00,807 - INFO - Going to convert document batch...
2025-11-14 16:54:00,808 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 16:54:02,548 - INFO - Finished converting document 10-Q_2023-10-27 in 3.25 sec.
2025-11-14 16:54:04,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2023-10-27' --> 'data\processed_data\JNJ\10-Q_2023-10-27.md'


2025-11-14 16:54:04,676 - INFO - Going to convert document batch...
2025-11-14 16:54:04,676 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 16:54:06,066 - INFO - Finished converting document 10-Q_2024-05-01 in 2.00 sec.
2025-11-14 16:54:06,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2024-05-01' --> 'data\processed_data\JNJ\10-Q_2024-05-01.md'


2025-11-14 16:54:08,301 - INFO - Going to convert document batch...
2025-11-14 16:54:08,302 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 16:54:10,406 - INFO - Finished converting document 10-Q_2024-07-25 in 3.73 sec.
2025-11-14 16:54:12,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2024-07-25' --> 'data\processed_data\JNJ\10-Q_2024-07-25.md'


2025-11-14 16:54:12,884 - INFO - Going to convert document batch...
2025-11-14 16:54:12,885 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 16:54:15,076 - INFO - Finished converting document 10-Q_2024-10-23 in 3.08 sec.
2025-11-14 16:54:16,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2024-10-23' --> 'data\processed_data\JNJ\10-Q_2024-10-23.md'


2025-11-14 16:54:16,640 - INFO - Going to convert document batch...
2025-11-14 16:54:16,641 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 16:54:18,054 - INFO - Finished converting document 10-Q_2025-04-23 in 2.06 sec.
2025-11-14 16:54:18,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2025-04-23' --> 'data\processed_data\JNJ\10-Q_2025-04-23.md'


2025-11-14 16:54:20,370 - INFO - Going to convert document batch...
2025-11-14 16:54:20,370 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:54:22,289 - INFO - Finished converting document 10-Q_2025-07-24 in 3.62 sec.
2025-11-14 16:54:23,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\10-Q_2025-07-24' --> 'data\processed_data\JNJ\10-Q_2025-07-24.md'


2025-11-14 16:54:24,243 - INFO - Going to convert document batch...
2025-11-14 16:54:24,244 - INFO - Processing document 10-Q_2025-10-22
2025-11-14 16:54:26,069 - INFO - Finished converting document 10-Q_2025-10-22 in 3.06 sec.
2025-11-14 16:54:27,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,180 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\JNJ\10-Q_2025-10-22' --> 'data\processed_data\JNJ\10-Q_2025-10-22.md'


2025-11-14 16:54:27,182 - INFO - Processing document 4_2023-01-18
2025-11-14 16:54:27,209 - INFO - Finished converting document 4_2023-01-18 in 0.22 sec.
2025-11-14 16:54:27,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,297 - INFO - Going to convert document batch...
2025-11-14 16:54:27,299 - INFO - Processing document 4_2023-02-14
2025-11-14 16:54:27,329 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.
2025-11-14 16:54:27,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,397 - INFO - Going to convert document batch...
2025-11-14 16:54:27,398 - INFO - Processing document 4_2023-02-15
2025-11-14 16:54:27,431 - INFO - Finished converting document 4_2023-02-15 in 0.06 sec.


Converted 'data\edgar_documents\JNJ\4_2023-01-18' --> 'data\processed_data\JNJ\4_2023-01-18.md'
Converted 'data\edgar_documents\JNJ\4_2023-02-14' --> 'data\processed_data\JNJ\4_2023-02-14.md'


2025-11-14 16:54:27,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,599 - INFO - Going to convert document batch...
2025-11-14 16:54:27,600 - INFO - Processing document 4_2023-03-08
2025-11-14 16:54:27,639 - INFO - Finished converting document 4_2023-03-08 in 0.19 sec.


Converted 'data\edgar_documents\JNJ\4_2023-02-15' --> 'data\processed_data\JNJ\4_2023-02-15.md'


2025-11-14 16:54:27,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,713 - INFO - Going to convert document batch...
2025-11-14 16:54:27,714 - INFO - Processing document 4_2023-03-09
2025-11-14 16:54:27,754 - INFO - Finished converting document 4_2023-03-09 in 0.08 sec.
2025-11-14 16:54:27,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:27,856 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\JNJ\4_2023-03-08' --> 'data\processed_data\JNJ\4_2023-03-08.md'
Converted 'data\edgar_documents\JNJ\4_2023-03-09' --> 'data\processed_data\JNJ\4_2023-03-09.md'


2025-11-14 16:54:27,857 - INFO - Processing document 4_2023-05-02
2025-11-14 16:54:27,879 - INFO - Finished converting document 4_2023-05-02 in 0.08 sec.
2025-11-14 16:54:27,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:28,014 - INFO - Going to convert document batch...
2025-11-14 16:54:28,019 - INFO - Processing document 4_2023-05-25


Converted 'data\edgar_documents\JNJ\4_2023-05-02' --> 'data\processed_data\JNJ\4_2023-05-02.md'


2025-11-14 16:54:28,705 - INFO - Finished converting document 4_2023-05-25 in 0.80 sec.
2025-11-14 16:54:28,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:28,772 - INFO - Going to convert document batch...
2025-11-14 16:54:28,773 - INFO - Processing document 4_2023-06-08
2025-11-14 16:54:28,794 - INFO - Finished converting document 4_2023-06-08 in 0.06 sec.
2025-11-14 16:54:28,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:28,875 - INFO - Going to convert document batch...
2025-11-14 16:54:28,876 - INFO - Processing document 4_2023-06-14
2025-11-14 16:54:28,899 - INFO - Finished converting document 4_2023-06-14 in 0.06 sec.


Converted 'data\edgar_documents\JNJ\4_2023-05-25' --> 'data\processed_data\JNJ\4_2023-05-25.md'
Converted 'data\edgar_documents\JNJ\4_2023-06-08' --> 'data\processed_data\JNJ\4_2023-06-08.md'
Converted 'data\edgar_documents\JNJ\4_2023-06-14' --> 'data\processed_data\JNJ\4_2023-06-14.md'


2025-11-14 16:54:28,963 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:28,963 - ERROR - Input document 4_2023-07-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54:28,966 - INFO - Going to convert document batch...
2025-11-14 16:54:28,983 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:28,984 - ERROR - Input document 4_2023-07-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\JNJ\4_2023-07-20: File format not allowed: data\edgar_documents\JNJ\4_2023-07-20
Error processing data\edgar_documents\JNJ\4_2023-07-24: File format not allowed: data\edgar_documents\JNJ\4_2023-07-24
Error processing data\edgar_documents\JNJ\4_2023-07-25: File format not allowed: data\edgar_documents\JNJ\4_2023-07-25
Error processing data\edgar_documents\JNJ\4_2023-07-26: File format not allowed: data\edgar_documents\JNJ\4_2023-07-26
Converted 'data\edgar_documents\JNJ\4_2023-07-27' --> 'data\processed_data\JNJ\4_2023-07-27.md'
Error processing data\edgar_documents\JNJ\4_2023-07-28: File format not allowed: data\edgar_documents\JNJ\4_2023-07-28
Error processing data\edgar_documents\JNJ\4_2023-07-31: File format not allowed: data\edgar_documents\JNJ\4_2023-07-31


2025-11-14 16:54:29,157 - ERROR - Input document 4_2023-08-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54:29,159 - INFO - Going to convert document batch...
2025-11-14 16:54:29,181 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:29,182 - ERROR - Input document 4_2023-08-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\JNJ\4_2023-08-01: File format not allowed: data\edgar_documents\JNJ\4_2023-08-01
Error processing data\edgar_documents\JNJ\4_2023-08-02: File format not allowed: data\edgar_documents\JNJ\4_2023-08-02
Error processing data\edgar_documents\JNJ\4_2023-08-03: File format not allowed: data\edgar_documents\JNJ\4_2023-08-03
Error processing data\edgar_documents\JNJ\4_2023-08-04: File format not allowed: data\edgar_documents\JNJ\4_2023-08-04
Error processing data\edgar_documents\JNJ\4_2023-08-07: File format not allowed: data\edgar_documents\JNJ\4_2023-08-07
Error processing data\edgar_documents\JNJ\4_2023-08-08: File format not allowed: data\edgar_documents\JNJ\4_2023-08-08
Error processing data\edgar_documents\JNJ\4_2023-08-09: File format not allowed: data\edgar_documents\JNJ\4_2023-08-09
Error processing data\edgar_documents\JNJ\4_2023-08-10: File format not allowed: data\edgar_documents\JNJ\4_2023-08-10
Error processing data\edgar_documents\JNJ\4_2023

2025-11-14 16:54:29,338 - ERROR - Input document 4_2023-08-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54:29,340 - INFO - Going to convert document batch...
2025-11-14 16:54:29,355 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:29,355 - ERROR - Input document 4_2023-08-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\JNJ\4_2023-08-15: File format not allowed: data\edgar_documents\JNJ\4_2023-08-15
Error processing data\edgar_documents\JNJ\4_2023-08-16: File format not allowed: data\edgar_documents\JNJ\4_2023-08-16
Error processing data\edgar_documents\JNJ\4_2023-08-17: File format not allowed: data\edgar_documents\JNJ\4_2023-08-17
Error processing data\edgar_documents\JNJ\4_2023-08-18: File format not allowed: data\edgar_documents\JNJ\4_2023-08-18
Error processing data\edgar_documents\JNJ\4_2023-08-21: File format not allowed: data\edgar_documents\JNJ\4_2023-08-21
Error processing data\edgar_documents\JNJ\4_2023-08-23: File format not allowed: data\edgar_documents\JNJ\4_2023-08-23
Converted 'data\edgar_documents\JNJ\4_2023-08-25' --> 'data\processed_data\JNJ\4_2023-08-25.md'


2025-11-14 16:54:29,541 - INFO - Going to convert document batch...
2025-11-14 16:54:29,542 - INFO - Processing document 4_2023-09-11
2025-11-14 16:54:29,580 - INFO - Finished converting document 4_2023-09-11 in 0.08 sec.
2025-11-14 16:54:29,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:29,636 - INFO - Going to convert document batch...
2025-11-14 16:54:29,637 - INFO - Processing document 4_2023-12-07
2025-11-14 16:54:29,664 - INFO - Finished converting document 4_2023-12-07 in 0.05 sec.
2025-11-14 16:54:29,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:29,732 - INFO - Going to convert document batch...
2025-11-14 16:54:29,734 - INFO - Processing document 4_2024-02-12
2025-11-14 16:54:29,775 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.


Converted 'data\edgar_documents\JNJ\4_2023-09-11' --> 'data\processed_data\JNJ\4_2023-09-11.md'
Converted 'data\edgar_documents\JNJ\4_2023-12-07' --> 'data\processed_data\JNJ\4_2023-12-07.md'


2025-11-14 16:54:29,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:29,864 - INFO - Going to convert document batch...
2025-11-14 16:54:29,866 - INFO - Processing document 4_2024-02-13
2025-11-14 16:54:29,897 - INFO - Finished converting document 4_2024-02-13 in 0.09 sec.
2025-11-14 16:54:29,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:29,975 - INFO - Going to convert document batch...
2025-11-14 16:54:29,976 - INFO - Processing document 4_2024-02-14


Converted 'data\edgar_documents\JNJ\4_2024-02-12' --> 'data\processed_data\JNJ\4_2024-02-12.md'
Converted 'data\edgar_documents\JNJ\4_2024-02-13' --> 'data\processed_data\JNJ\4_2024-02-13.md'


2025-11-14 16:54:30,000 - INFO - Finished converting document 4_2024-02-14 in 0.08 sec.
2025-11-14 16:54:30,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,059 - INFO - Going to convert document batch...
2025-11-14 16:54:30,060 - INFO - Processing document 4_2024-02-15
2025-11-14 16:54:30,089 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.
2025-11-14 16:54:30,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,163 - INFO - Going to convert document batch...
2025-11-14 16:54:30,164 - INFO - Processing document 4_2024-02-20
2025-11-14 16:54:30,201 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.


Converted 'data\edgar_documents\JNJ\4_2024-02-14' --> 'data\processed_data\JNJ\4_2024-02-14.md'
Converted 'data\edgar_documents\JNJ\4_2024-02-15' --> 'data\processed_data\JNJ\4_2024-02-15.md'


2025-11-14 16:54:30,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,308 - INFO - Going to convert document batch...
2025-11-14 16:54:30,308 - INFO - Processing document 4_2024-03-06
2025-11-14 16:54:30,412 - INFO - Finished converting document 4_2024-03-06 in 0.19 sec.


Converted 'data\edgar_documents\JNJ\4_2024-02-20' --> 'data\processed_data\JNJ\4_2024-02-20.md'


2025-11-14 16:54:30,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,661 - INFO - Going to convert document batch...
2025-11-14 16:54:30,663 - INFO - Processing document 4_2024-03-07
2025-11-14 16:54:30,700 - INFO - Finished converting document 4_2024-03-07 in 0.11 sec.
2025-11-14 16:54:30,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,787 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\JNJ\4_2024-03-06' --> 'data\processed_data\JNJ\4_2024-03-06.md'
Converted 'data\edgar_documents\JNJ\4_2024-03-07' --> 'data\processed_data\JNJ\4_2024-03-07.md'


2025-11-14 16:54:30,789 - INFO - Processing document 4_2024-03-13
2025-11-14 16:54:30,818 - INFO - Finished converting document 4_2024-03-13 in 0.08 sec.
2025-11-14 16:54:30,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:30,883 - INFO - Going to convert document batch...
2025-11-14 16:54:30,884 - INFO - Processing document 4_2024-04-29
2025-11-14 16:54:31,000 - INFO - Finished converting document 4_2024-04-29 in 0.16 sec.


Converted 'data\edgar_documents\JNJ\4_2024-03-13' --> 'data\processed_data\JNJ\4_2024-03-13.md'


2025-11-14 16:54:31,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:31,089 - INFO - Going to convert document batch...
2025-11-14 16:54:31,090 - INFO - Processing document 4_2024-05-03
2025-11-14 16:54:31,119 - INFO - Finished converting document 4_2024-05-03 in 0.09 sec.
2025-11-14 16:54:31,196 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:31,196 - ERROR - Input document 4_2024-05-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54

Converted 'data\edgar_documents\JNJ\4_2024-04-29' --> 'data\processed_data\JNJ\4_2024-04-29.md'
Converted 'data\edgar_documents\JNJ\4_2024-05-03' --> 'data\processed_data\JNJ\4_2024-05-03.md'
Error processing data\edgar_documents\JNJ\4_2024-05-13: File format not allowed: data\edgar_documents\JNJ\4_2024-05-13


2025-11-14 16:54:31,219 - ERROR - Input document 4_2024-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54:31,221 - INFO - Going to convert document batch...
2025-11-14 16:54:31,245 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:31,246 - ERROR - Input document 4_2024-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\JNJ\4_2024-05-14: File format not allowed: data\edgar_documents\JNJ\4_2024-05-14
Error processing data\edgar_documents\JNJ\4_2024-05-15: File format not allowed: data\edgar_documents\JNJ\4_2024-05-15
Error processing data\edgar_documents\JNJ\4_2024-05-16: File format not allowed: data\edgar_documents\JNJ\4_2024-05-16


2025-11-14 16:54:31,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:31,471 - INFO - Going to convert document batch...
2025-11-14 16:54:31,473 - INFO - Processing document 4_2024-07-09
2025-11-14 16:54:31,526 - INFO - Finished converting document 4_2024-07-09 in 0.11 sec.


Converted 'data\edgar_documents\JNJ\4_2024-06-06' --> 'data\processed_data\JNJ\4_2024-06-06.md'
Converted 'data\edgar_documents\JNJ\4_2024-07-09' --> 'data\processed_data\JNJ\4_2024-07-09.md'


2025-11-14 16:54:31,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:31,661 - INFO - Going to convert document batch...
2025-11-14 16:54:31,662 - INFO - Processing document 4_2024-09-03
2025-11-14 16:54:31,761 - INFO - Finished converting document 4_2024-09-03 in 0.19 sec.
2025-11-14 16:54:31,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:31,863 - INFO - Going to convert document batch...
2025-11-14 16:54:31,864 - INFO - Processing document 4_2024-09-12
2025-11-14 16:54:31,895 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.
2025-11-14 16:54:31,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:31,954 - INFO - Going to convert document batch...
2025-11-14 16:54:31,955 - INFO - Processing document 4_2024-10-15
2025-11-14 16:54:31,978 - INFO - Finished converting document 4_2024-10-15 in 0.05 sec.


Converted 'data\edgar_documents\JNJ\4_2024-09-03' --> 'data\processed_data\JNJ\4_2024-09-03.md'
Converted 'data\edgar_documents\JNJ\4_2024-09-12' --> 'data\processed_data\JNJ\4_2024-09-12.md'


2025-11-14 16:54:32,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,047 - INFO - Going to convert document batch...
2025-11-14 16:54:32,049 - INFO - Processing document 4_2024-10-21
2025-11-14 16:54:32,084 - INFO - Finished converting document 4_2024-10-21 in 0.08 sec.
2025-11-14 16:54:32,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,153 - INFO - Going to convert document batch...
2025-11-14 16:54:32,154 - INFO - Processing document 4_2024-10-31
2025-11-14 16:54:32,180 - INFO - Finished converting document 4_2024-10-31 in 0.06 sec.


Converted 'data\edgar_documents\JNJ\4_2024-10-15' --> 'data\processed_data\JNJ\4_2024-10-15.md'
Converted 'data\edgar_documents\JNJ\4_2024-10-21' --> 'data\processed_data\JNJ\4_2024-10-21.md'


2025-11-14 16:54:32,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,251 - INFO - Going to convert document batch...
2025-11-14 16:54:32,252 - INFO - Processing document 4_2024-12-12
2025-11-14 16:54:32,282 - INFO - Finished converting document 4_2024-12-12 in 0.08 sec.
2025-11-14 16:54:32,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,349 - INFO - Going to convert document batch...
2025-11-14 16:54:32,350 - INFO - Processing document 4_2025-02-11
2025-11-14 16:54:32,373 - INFO - Finished converting document 4_2025-02-11 in 0.06 sec.


Converted 'data\edgar_documents\JNJ\4_2024-10-31' --> 'data\processed_data\JNJ\4_2024-10-31.md'
Converted 'data\edgar_documents\JNJ\4_2024-12-12' --> 'data\processed_data\JNJ\4_2024-12-12.md'
Converted 'data\edgar_documents\JNJ\4_2025-02-11' --> 'data\processed_data\JNJ\4_2025-02-11.md'


2025-11-14 16:54:32,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,439 - INFO - Going to convert document batch...
2025-11-14 16:54:32,440 - INFO - Processing document 4_2025-02-12
2025-11-14 16:54:32,472 - INFO - Finished converting document 4_2025-02-12 in 0.06 sec.
2025-11-14 16:54:32,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,579 - INFO - Going to convert document batch...
2025-11-14 16:54:32,580 - INFO - Processing document 4_2025-02-18
2025-11-14 16:54:32,605 - INFO - Finished converting document 4_2025-02-18 in 0.09 sec.
2025-11-14 16:54:32,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,674 - INFO - Going to convert document batch...
2025-11-14 16:54:32,676 - INFO - Processing document 4_2025-02-19
2025-11-14 16:54:32,704 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.


Converted 'data\edgar_documents\JNJ\4_2025-02-12' --> 'data\processed_data\JNJ\4_2025-02-12.md'
Converted 'data\edgar_documents\JNJ\4_2025-02-18' --> 'data\processed_data\JNJ\4_2025-02-18.md'


2025-11-14 16:54:32,769 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:54:32,770 - ERROR - Input document 4_2025-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:54:32,771 - INFO - Going to convert document batch...
2025-11-14 16:54:32,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,801 - INFO - Going to convert document batch...
2025-11-14 16:54:32,802 - INFO - Processing document 4_2025-02-26
2025-11-14 16:54:32,833 - INFO - Fin

Converted 'data\edgar_documents\JNJ\4_2025-02-19' --> 'data\processed_data\JNJ\4_2025-02-19.md'
Error processing data\edgar_documents\JNJ\4_2025-02-21: File format not allowed: data\edgar_documents\JNJ\4_2025-02-21
Converted 'data\edgar_documents\JNJ\4_2025-02-26' --> 'data\processed_data\JNJ\4_2025-02-26.md'


2025-11-14 16:54:32,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:32,990 - INFO - Going to convert document batch...
2025-11-14 16:54:32,992 - INFO - Processing document 4_2025-03-19
2025-11-14 16:54:33,016 - INFO - Finished converting document 4_2025-03-19 in 0.06 sec.
2025-11-14 16:54:33,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,076 - INFO - Going to convert document batch...
2025-11-14 16:54:33,077 - INFO - Processing document 4_2025-04-28
2025-11-14 16:54:33,105 - INFO - Finished converting document 4_2025-04-28 in 0.08 sec.
2025-11-14 16:54:33,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\4_2025-03-06' --> 'data\processed_data\JNJ\4_2025-03-06.md'
Converted 'data\edgar_documents\JNJ\4_2025-03-19' --> 'data\processed_data\JNJ\4_2025-03-19.md'
Converted 'data\edgar_documents\JNJ\4_2025-04-28' --> 'data\processed_data\JNJ\4_2025-04-28.md'


2025-11-14 16:54:33,172 - INFO - Going to convert document batch...
2025-11-14 16:54:33,173 - INFO - Processing document 4_2025-05-05
2025-11-14 16:54:33,208 - INFO - Finished converting document 4_2025-05-05 in 0.08 sec.
2025-11-14 16:54:33,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,266 - INFO - Going to convert document batch...
2025-11-14 16:54:33,268 - INFO - Processing document 4_2025-06-12
2025-11-14 16:54:33,289 - INFO - Finished converting document 4_2025-06-12 in 0.05 sec.
2025-11-14 16:54:33,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,360 - INFO - Going to convert document batch...
2025-11-14 16:54:33,362 - INFO - Processing document 4_2025-07-18
2025-11-14 16:54:33,383 - INFO - Finished converting document 4_2025-07-18 in 0.05 sec.
2025-11-14 16:54:33,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\4_2025-05-05' --> 'data\processed_data\JNJ\4_2025-05-05.md'
Converted 'data\edgar_documents\JNJ\4_2025-06-12' --> 'data\processed_data\JNJ\4_2025-06-12.md'
Converted 'data\edgar_documents\JNJ\4_2025-07-18' --> 'data\processed_data\JNJ\4_2025-07-18.md'


2025-11-14 16:54:33,430 - INFO - Going to convert document batch...
2025-11-14 16:54:33,431 - INFO - Processing document 4_2025-08-18
2025-11-14 16:54:33,471 - INFO - Finished converting document 4_2025-08-18 in 0.06 sec.
2025-11-14 16:54:33,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,532 - INFO - Going to convert document batch...
2025-11-14 16:54:33,533 - INFO - Processing document 4_2025-08-25
2025-11-14 16:54:33,556 - INFO - Finished converting document 4_2025-08-25 in 0.05 sec.
2025-11-14 16:54:33,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,614 - INFO - Going to convert document batch...
2025-11-14 16:54:33,615 - INFO - Processing document 4_2025-09-03
2025-11-14 16:54:33,641 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.
2025-11-14 16:54:33,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\4_2025-08-18' --> 'data\processed_data\JNJ\4_2025-08-18.md'
Converted 'data\edgar_documents\JNJ\4_2025-08-25' --> 'data\processed_data\JNJ\4_2025-08-25.md'
Converted 'data\edgar_documents\JNJ\4_2025-09-03' --> 'data\processed_data\JNJ\4_2025-09-03.md'


2025-11-14 16:54:33,697 - INFO - Going to convert document batch...
2025-11-14 16:54:33,698 - INFO - Processing document 4_2025-09-05
2025-11-14 16:54:33,729 - INFO - Finished converting document 4_2025-09-05 in 0.06 sec.
2025-11-14 16:54:33,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,800 - INFO - Going to convert document batch...
2025-11-14 16:54:33,800 - INFO - Processing document 4_2025-09-11
2025-11-14 16:54:33,821 - INFO - Finished converting document 4_2025-09-11 in 0.05 sec.
2025-11-14 16:54:33,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:33,872 - INFO - Going to convert document batch...
2025-11-14 16:54:33,873 - INFO - Processing document 4_2025-10-20
2025-11-14 16:54:33,904 - INFO - Finished converting document 4_2025-10-20 in 0.06 sec.
2025-11-14 16:54:33,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\4_2025-09-05' --> 'data\processed_data\JNJ\4_2025-09-05.md'
Converted 'data\edgar_documents\JNJ\4_2025-09-11' --> 'data\processed_data\JNJ\4_2025-09-11.md'
Converted 'data\edgar_documents\JNJ\4_2025-10-20' --> 'data\processed_data\JNJ\4_2025-10-20.md'


2025-11-14 16:54:33,968 - INFO - Going to convert document batch...
2025-11-14 16:54:33,970 - INFO - Processing document 4_2025-11-10
2025-11-14 16:54:34,091 - INFO - Finished converting document 4_2025-11-10 in 0.17 sec.
2025-11-14 16:54:34,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,222 - INFO - Going to convert document batch...
2025-11-14 16:54:34,223 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:54:34,252 - INFO - Finished converting document 8-K_2023-01-24 in 0.11 sec.
2025-11-14 16:54:34,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,321 - INFO - Going to convert document batch...
2025-11-14 16:54:34,322 - INFO - Processing document 8-K_2023-02-14


Converted 'data\edgar_documents\JNJ\4_2025-11-10' --> 'data\processed_data\JNJ\4_2025-11-10.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-01-24' --> 'data\processed_data\JNJ\8-K_2023-01-24.md'


2025-11-14 16:54:34,340 - INFO - Finished converting document 8-K_2023-02-14 in 0.08 sec.
2025-11-14 16:54:34,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,392 - INFO - Going to convert document batch...
2025-11-14 16:54:34,393 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:54:34,417 - INFO - Finished converting document 8-K_2023-02-15 in 0.08 sec.
2025-11-14 16:54:34,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,487 - INFO - Going to convert document batch...
2025-11-14 16:54:34,488 - INFO - Processing document 8-K_2023-04-03
2025-11-14 16:54:34,506 - INFO - Finished converting document 8-K_2023-04-03 in 0.08 sec.
2025-11-14 16:54:34,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2023-02-14' --> 'data\processed_data\JNJ\8-K_2023-02-14.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-02-15' --> 'data\processed_data\JNJ\8-K_2023-02-15.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-04-03' --> 'data\processed_data\JNJ\8-K_2023-04-03.md'


2025-11-14 16:54:34,558 - INFO - Going to convert document batch...
2025-11-14 16:54:34,559 - INFO - Processing document 8-K_2023-04-04
2025-11-14 16:54:34,587 - INFO - Finished converting document 8-K_2023-04-04 in 0.06 sec.
2025-11-14 16:54:34,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,646 - INFO - Going to convert document batch...
2025-11-14 16:54:34,666 - INFO - Processing document 8-K_2023-04-18
2025-11-14 16:54:34,738 - INFO - Finished converting document 8-K_2023-04-18 in 0.14 sec.
2025-11-14 16:54:34,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2023-04-04' --> 'data\processed_data\JNJ\8-K_2023-04-04.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-04-18' --> 'data\processed_data\JNJ\8-K_2023-04-18.md'


2025-11-14 16:54:34,826 - INFO - Going to convert document batch...
2025-11-14 16:54:34,827 - INFO - Processing document 8-K_2023-05-01
2025-11-14 16:54:34,870 - INFO - Finished converting document 8-K_2023-05-01 in 0.12 sec.
2025-11-14 16:54:34,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:34,926 - INFO - Going to convert document batch...
2025-11-14 16:54:34,928 - INFO - Processing document 8-K_2023-05-08


Converted 'data\edgar_documents\JNJ\8-K_2023-05-01' --> 'data\processed_data\JNJ\8-K_2023-05-01.md'


2025-11-14 16:54:35,258 - INFO - Finished converting document 8-K_2023-05-08 in 0.36 sec.
2025-11-14 16:54:35,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:35,408 - INFO - Going to convert document batch...
2025-11-14 16:54:35,410 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:54:35,447 - INFO - Finished converting document 8-K_2023-07-20 in 0.17 sec.


Converted 'data\edgar_documents\JNJ\8-K_2023-05-08' --> 'data\processed_data\JNJ\8-K_2023-05-08.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-07-20' --> 'data\processed_data\JNJ\8-K_2023-07-20.md'


2025-11-14 16:54:35,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:35,524 - INFO - Going to convert document batch...
2025-11-14 16:54:35,525 - INFO - Processing document 8-K_2023-07-24
2025-11-14 16:54:35,549 - INFO - Finished converting document 8-K_2023-07-24 in 0.09 sec.
2025-11-14 16:54:35,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:35,603 - INFO - Going to convert document batch...
2025-11-14 16:54:35,604 - INFO - Processing document 8-K_2023-07-28
2025-11-14 16:54:35,624 - INFO - Finished converting document 8-K_2023-07-28 in 0.06 sec.
2025-11-14 16:54:35,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:35,684 - INFO - Going to convert document batch...
2025-11-14 16:54:35,685 - INFO - Processing document 8-K_2023-08-25
2025-11-14 16:54:35,700 - INFO - Finished converting document 8-K_2023-08-25 in 0.08 sec.
2025-11-14 16:54:35,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\JNJ\8-K_2023-07-24' --> 'data\processed_data\JNJ\8-K_2023-07-24.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-07-28' --> 'data\processed_data\JNJ\8-K_2023-07-28.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-08-25' --> 'data\processed_data\JNJ\8-K_2023-08-25.md'


2025-11-14 16:54:35,761 - INFO - Processing document 8-K_2023-08-30
2025-11-14 16:54:35,783 - INFO - Finished converting document 8-K_2023-08-30 in 0.08 sec.
2025-11-14 16:54:35,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:35,933 - INFO - Going to convert document batch...
2025-11-14 16:54:35,934 - INFO - Processing document 8-K_2023-10-17
2025-11-14 16:54:35,953 - INFO - Finished converting document 8-K_2023-10-17 in 0.09 sec.
2025-11-14 16:54:35,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,021 - INFO - Going to convert document batch...
2025-11-14 16:54:36,022 - INFO - Processing document 8-K_2023-10-23
2025-11-14 16:54:36,044 - INFO - Finished converting document 8-K_2023-10-23 in 0.09 sec.


Converted 'data\edgar_documents\JNJ\8-K_2023-08-30' --> 'data\processed_data\JNJ\8-K_2023-08-30.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-10-17' --> 'data\processed_data\JNJ\8-K_2023-10-17.md'


2025-11-14 16:54:36,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,107 - INFO - Going to convert document batch...
2025-11-14 16:54:36,108 - INFO - Processing document 8-K_2023-11-27
2025-11-14 16:54:36,138 - INFO - Finished converting document 8-K_2023-11-27 in 0.09 sec.
2025-11-14 16:54:36,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,219 - INFO - Going to convert document batch...
2025-11-14 16:54:36,220 - INFO - Processing document 8-K_2023-11-30


Converted 'data\edgar_documents\JNJ\8-K_2023-10-23' --> 'data\processed_data\JNJ\8-K_2023-10-23.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-11-27' --> 'data\processed_data\JNJ\8-K_2023-11-27.md'


2025-11-14 16:54:36,241 - INFO - Finished converting document 8-K_2023-11-30 in 0.08 sec.
2025-11-14 16:54:36,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,284 - INFO - Going to convert document batch...
2025-11-14 16:54:36,285 - INFO - Processing document 8-K_2023-12-05
2025-11-14 16:54:36,317 - INFO - Finished converting document 8-K_2023-12-05 in 0.06 sec.
2025-11-14 16:54:36,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,374 - INFO - Going to convert document batch...
2025-11-14 16:54:36,376 - INFO - Processing document 8-K_2024-01-23
2025-11-14 16:54:36,400 - INFO - Finished converting document 8-K_2024-01-23 in 0.08 sec.
2025-11-14 16:54:36,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2023-11-30' --> 'data\processed_data\JNJ\8-K_2023-11-30.md'
Converted 'data\edgar_documents\JNJ\8-K_2023-12-05' --> 'data\processed_data\JNJ\8-K_2023-12-05.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-01-23' --> 'data\processed_data\JNJ\8-K_2024-01-23.md'


2025-11-14 16:54:36,455 - INFO - Going to convert document batch...
2025-11-14 16:54:36,455 - INFO - Processing document 8-K_2024-04-16
2025-11-14 16:54:36,479 - INFO - Finished converting document 8-K_2024-04-16 in 0.08 sec.
2025-11-14 16:54:36,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,547 - INFO - Going to convert document batch...
2025-11-14 16:54:36,547 - INFO - Processing document 8-K_2024-04-29
2025-11-14 16:54:36,582 - INFO - Finished converting document 8-K_2024-04-29 in 0.09 sec.
2025-11-14 16:54:36,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,646 - INFO - Going to convert document batch...
2025-11-14 16:54:36,646 - INFO - Processing document 8-K_2024-05-01
2025-11-14 16:54:36,674 - INFO - Finished converting document 8-K_2024-05-01 in 0.08 sec.


Converted 'data\edgar_documents\JNJ\8-K_2024-04-16' --> 'data\processed_data\JNJ\8-K_2024-04-16.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-04-29' --> 'data\processed_data\JNJ\8-K_2024-04-29.md'


2025-11-14 16:54:36,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,731 - INFO - Going to convert document batch...
2025-11-14 16:54:36,732 - INFO - Processing document 8-K_2024-05-17
2025-11-14 16:54:36,761 - INFO - Finished converting document 8-K_2024-05-17 in 0.08 sec.
2025-11-14 16:54:36,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,831 - INFO - Going to convert document batch...
2025-11-14 16:54:36,832 - INFO - Processing document 8-K_2024-05-20
2025-11-14 16:54:36,872 - INFO - Finished converting document 8-K_2024-05-20 in 0.11 sec.


Converted 'data\edgar_documents\JNJ\8-K_2024-05-01' --> 'data\processed_data\JNJ\8-K_2024-05-01.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-05-17' --> 'data\processed_data\JNJ\8-K_2024-05-17.md'


2025-11-14 16:54:36,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:36,940 - INFO - Going to convert document batch...
2025-11-14 16:54:36,941 - INFO - Processing document 8-K_2024-07-17
2025-11-14 16:54:36,978 - INFO - Finished converting document 8-K_2024-07-17 in 0.08 sec.
2025-11-14 16:54:37,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,038 - INFO - Going to convert document batch...
2025-11-14 16:54:37,039 - INFO - Processing document 8-K_2024-08-26
2025-11-14 16:54:37,068 - INFO - Finished converting document 8-K_2024-08-26 in 0.08 sec.


Converted 'data\edgar_documents\JNJ\8-K_2024-05-20' --> 'data\processed_data\JNJ\8-K_2024-05-20.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-07-17' --> 'data\processed_data\JNJ\8-K_2024-07-17.md'


2025-11-14 16:54:37,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,120 - INFO - Going to convert document batch...
2025-11-14 16:54:37,121 - INFO - Processing document 8-K_2024-09-10
2025-11-14 16:54:37,153 - INFO - Finished converting document 8-K_2024-09-10 in 0.08 sec.
2025-11-14 16:54:37,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,222 - INFO - Going to convert document batch...
2025-11-14 16:54:37,222 - INFO - Processing document 8-K_2024-09-20
2025-11-14 16:54:37,250 - INFO - Finished converting document 8-K_2024-09-20 in 0.06 sec.
2025-11-14 16:54:37,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2024-08-26' --> 'data\processed_data\JNJ\8-K_2024-08-26.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-09-10' --> 'data\processed_data\JNJ\8-K_2024-09-10.md'
Converted 'data\edgar_documents\JNJ\8-K_2024-09-20' --> 'data\processed_data\JNJ\8-K_2024-09-20.md'


2025-11-14 16:54:37,301 - INFO - Going to convert document batch...
2025-11-14 16:54:37,301 - INFO - Processing document 8-K_2024-10-15
2025-11-14 16:54:37,326 - INFO - Finished converting document 8-K_2024-10-15 in 0.06 sec.
2025-11-14 16:54:37,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,374 - INFO - Going to convert document batch...
2025-11-14 16:54:37,375 - INFO - Processing document 8-K_2025-01-22
2025-11-14 16:54:37,398 - INFO - Finished converting document 8-K_2025-01-22 in 0.05 sec.
2025-11-14 16:54:37,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,450 - INFO - Going to convert document batch...
2025-11-14 16:54:37,451 - INFO - Processing document 8-K_2025-02-20
2025-11-14 16:54:37,492 - INFO - Finished converting document 8-K_2025-02-20 in 0.08 sec.
2025-11-14 16:54:37,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2024-10-15' --> 'data\processed_data\JNJ\8-K_2024-10-15.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-01-22' --> 'data\processed_data\JNJ\8-K_2025-01-22.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-02-20' --> 'data\processed_data\JNJ\8-K_2025-02-20.md'


2025-11-14 16:54:37,552 - INFO - Going to convert document batch...
2025-11-14 16:54:37,553 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:54:37,595 - INFO - Finished converting document 8-K_2025-02-26 in 0.08 sec.
2025-11-14 16:54:37,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,640 - INFO - Going to convert document batch...
2025-11-14 16:54:37,641 - INFO - Processing document 8-K_2025-04-03
2025-11-14 16:54:37,670 - INFO - Finished converting document 8-K_2025-04-03 in 0.06 sec.
2025-11-14 16:54:37,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:37,717 - INFO - Going to convert document batch...
2025-11-14 16:54:37,718 - INFO - Processing document 8-K_2025-04-15
2025-11-14 16:54:37,751 - INFO - Finished converting document 8-K_2025-04-15 in 0.06 sec.
2025-11-14 16:54:37,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2025-02-26' --> 'data\processed_data\JNJ\8-K_2025-02-26.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-04-03' --> 'data\processed_data\JNJ\8-K_2025-04-03.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-04-15' --> 'data\processed_data\JNJ\8-K_2025-04-15.md'


2025-11-14 16:54:37,814 - INFO - Going to convert document batch...
2025-11-14 16:54:37,815 - INFO - Processing document 8-K_2025-04-30
2025-11-14 16:54:37,876 - INFO - Finished converting document 8-K_2025-04-30 in 0.11 sec.
2025-11-14 16:54:37,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:38,017 - INFO - Going to convert document batch...
2025-11-14 16:54:38,018 - INFO - Processing document 8-K_2025-06-10
2025-11-14 16:54:38,046 - INFO - Finished converting document 8-K_2025-06-10 in 0.16 sec.


Converted 'data\edgar_documents\JNJ\8-K_2025-04-30' --> 'data\processed_data\JNJ\8-K_2025-04-30.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-06-10' --> 'data\processed_data\JNJ\8-K_2025-06-10.md'


2025-11-14 16:54:38,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:38,136 - INFO - Going to convert document batch...
2025-11-14 16:54:38,137 - INFO - Processing document 8-K_2025-07-16
2025-11-14 16:54:38,176 - INFO - Finished converting document 8-K_2025-07-16 in 0.12 sec.
2025-11-14 16:54:38,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:38,251 - INFO - Going to convert document batch...
2025-11-14 16:54:38,252 - INFO - Processing document 8-K_2025-09-09
2025-11-14 16:54:38,289 - INFO - Finished converting document 8-K_2025-09-09 in 0.08 sec.
2025-11-14 16:54:38,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:54:38,369 - INFO - Going to convert document batch...
2025-11-14 16:54:38,370 - INFO - Processing document 8-K_2025-10-14


Converted 'data\edgar_documents\JNJ\8-K_2025-07-16' --> 'data\processed_data\JNJ\8-K_2025-07-16.md'
Converted 'data\edgar_documents\JNJ\8-K_2025-09-09' --> 'data\processed_data\JNJ\8-K_2025-09-09.md'


2025-11-14 16:54:38,397 - INFO - Finished converting document 8-K_2025-10-14 in 0.08 sec.
2025-11-14 16:54:38,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\8-K_2025-10-14' --> 'data\processed_data\JNJ\8-K_2025-10-14.md'


2025-11-14 16:54:39,537 - INFO - Going to convert document batch...
2025-11-14 16:54:39,538 - INFO - Processing document DEF-14A_2023-03-15
2025-11-14 16:54:43,500 - INFO - Finished converting document DEF-14A_2023-03-15 in 5.09 sec.
2025-11-14 16:54:47,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\DEF-14A_2023-03-15' --> 'data\processed_data\JNJ\DEF-14A_2023-03-15.md'


2025-11-14 16:54:48,052 - INFO - Going to convert document batch...
2025-11-14 16:54:48,053 - INFO - Processing document DEF-14A_2024-03-13
2025-11-14 16:54:53,861 - INFO - Finished converting document DEF-14A_2024-03-13 in 6.80 sec.
2025-11-14 16:54:55,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\DEF-14A_2024-03-13' --> 'data\processed_data\JNJ\DEF-14A_2024-03-13.md'


2025-11-14 16:54:56,828 - INFO - Going to convert document batch...
2025-11-14 16:54:56,829 - INFO - Processing document DEF-14A_2025-03-12
2025-11-14 16:55:02,597 - INFO - Finished converting document DEF-14A_2025-03-12 in 7.11 sec.
2025-11-14 16:55:04,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\JNJ\DEF-14A_2025-03-12' --> 'data\processed_data\JNJ\DEF-14A_2025-03-12.md'
Processed 103 new files. Errors: 27
Found 126 files to process in data\edgar_documents\KO


2025-11-14 16:55:05,979 - INFO - Going to convert document batch...
2025-11-14 16:55:05,980 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:55:05,980 - INFO - Processing document 10-K_2023-02-21
2025-11-14 16:55:09,224 - INFO - Finished converting document 10-K_2023-02-21 in 5.05 sec.
2025-11-14 16:55:10,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-K_2023-02-21' --> 'data\processed_data\KO\10-K_2023-02-21.md'


2025-11-14 16:55:11,111 - INFO - Going to convert document batch...
2025-11-14 16:55:11,111 - INFO - Processing document 10-K_2024-02-20
2025-11-14 16:55:14,508 - INFO - Finished converting document 10-K_2024-02-20 in 4.41 sec.
2025-11-14 16:55:15,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-K_2024-02-20' --> 'data\processed_data\KO\10-K_2024-02-20.md'


2025-11-14 16:55:16,370 - INFO - Going to convert document batch...
2025-11-14 16:55:16,371 - INFO - Processing document 10-K_2025-02-20
2025-11-14 16:55:19,997 - INFO - Finished converting document 10-K_2025-02-20 in 4.61 sec.
2025-11-14 16:55:20,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-K_2025-02-20' --> 'data\processed_data\KO\10-K_2025-02-20.md'


2025-11-14 16:55:21,813 - INFO - Going to convert document batch...
2025-11-14 16:55:21,814 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 16:55:22,574 - INFO - Finished converting document 10-Q_2023-04-26 in 1.67 sec.
2025-11-14 16:55:23,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2023-04-26' --> 'data\processed_data\KO\10-Q_2023-04-26.md'


2025-11-14 16:55:23,516 - INFO - Going to convert document batch...
2025-11-14 16:55:23,519 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 16:55:24,639 - INFO - Finished converting document 10-Q_2023-07-27 in 1.70 sec.
2025-11-14 16:55:25,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2023-07-27' --> 'data\processed_data\KO\10-Q_2023-07-27.md'


2025-11-14 16:55:26,648 - INFO - Going to convert document batch...
2025-11-14 16:55:26,648 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 16:55:28,068 - INFO - Finished converting document 10-Q_2023-10-24 in 2.77 sec.
2025-11-14 16:55:28,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2023-10-24' --> 'data\processed_data\KO\10-Q_2023-10-24.md'


2025-11-14 16:55:29,286 - INFO - Going to convert document batch...
2025-11-14 16:55:29,286 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:55:30,116 - INFO - Finished converting document 10-Q_2024-05-02 in 1.53 sec.
2025-11-14 16:55:30,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:30,583 - INFO - Going to convert document batch...
2025-11-14 16:55:30,584 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 16:55:30,615 - INFO - Finished converting document 10-Q_2024-05-30 in 0.11 sec.
2025-11-14 16:55:30,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2024-05-02' --> 'data\processed_data\KO\10-Q_2024-05-02.md'
Converted 'data\edgar_documents\KO\10-Q_2024-05-30' --> 'data\processed_data\KO\10-Q_2024-05-30.md'


2025-11-14 16:55:31,184 - INFO - Going to convert document batch...
2025-11-14 16:55:31,185 - INFO - Processing document 10-Q_2024-07-29
2025-11-14 16:55:32,409 - INFO - Finished converting document 10-Q_2024-07-29 in 1.77 sec.
2025-11-14 16:55:33,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2024-07-29' --> 'data\processed_data\KO\10-Q_2024-07-29.md'


2025-11-14 16:55:34,072 - INFO - Going to convert document batch...
2025-11-14 16:55:34,073 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 16:55:35,257 - INFO - Finished converting document 10-Q_2024-10-24 in 2.25 sec.
2025-11-14 16:55:35,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2024-10-24' --> 'data\processed_data\KO\10-Q_2024-10-24.md'


2025-11-14 16:55:36,315 - INFO - Going to convert document batch...
2025-11-14 16:55:36,316 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:55:37,069 - INFO - Finished converting document 10-Q_2025-05-01 in 1.17 sec.
2025-11-14 16:55:37,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2025-05-01' --> 'data\processed_data\KO\10-Q_2025-05-01.md'


2025-11-14 16:55:38,561 - INFO - Going to convert document batch...
2025-11-14 16:55:38,562 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 16:55:39,930 - INFO - Finished converting document 10-Q_2025-07-24 in 2.50 sec.
2025-11-14 16:55:40,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2025-07-24' --> 'data\processed_data\KO\10-Q_2025-07-24.md'


2025-11-14 16:55:41,313 - INFO - Going to convert document batch...
2025-11-14 16:55:41,314 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 16:55:42,767 - INFO - Finished converting document 10-Q_2025-10-23 in 2.31 sec.
2025-11-14 16:55:43,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,473 - INFO - Going to convert document batch...
2025-11-14 16:55:43,474 - INFO - Processing document 4_2023-01-19
2025-11-14 16:55:43,502 - INFO - Finished converting document 4_2023-01-19 in 0.06 sec.
2025-11-14 16:55:43,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,563 - INFO - Going to convert document batch...
2025-11-14 16:55:43,564 - INFO - Processing document 4_2023-02-15
2025-11-14 16:55:43,589 - INFO - Finished converting document 4_2023-02-15 in 0.06 sec.
2025-11-14 16:55:43,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\10-Q_2025-10-23' --> 'data\processed_data\KO\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\KO\4_2023-01-19' --> 'data\processed_data\KO\4_2023-01-19.md'
Converted 'data\edgar_documents\KO\4_2023-02-15' --> 'data\processed_data\KO\4_2023-02-15.md'


2025-11-14 16:55:43,637 - INFO - Going to convert document batch...
2025-11-14 16:55:43,638 - INFO - Processing document 4_2023-02-21
2025-11-14 16:55:43,676 - INFO - Finished converting document 4_2023-02-21 in 0.06 sec.
2025-11-14 16:55:43,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,748 - INFO - Going to convert document batch...
2025-11-14 16:55:43,748 - INFO - Processing document 4_2023-02-23
2025-11-14 16:55:43,775 - INFO - Finished converting document 4_2023-02-23 in 0.05 sec.
2025-11-14 16:55:43,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,830 - INFO - Going to convert document batch...
2025-11-14 16:55:43,830 - INFO - Processing document 4_2023-03-01
2025-11-14 16:55:43,855 - INFO - Finished converting document 4_2023-03-01 in 0.06 sec.
2025-11-14 16:55:43,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,898 - INFO - Going to convert document batch...
2025-11-14 16:55:43,899 - 

Converted 'data\edgar_documents\KO\4_2023-02-21' --> 'data\processed_data\KO\4_2023-02-21.md'
Converted 'data\edgar_documents\KO\4_2023-02-23' --> 'data\processed_data\KO\4_2023-02-23.md'
Converted 'data\edgar_documents\KO\4_2023-03-01' --> 'data\processed_data\KO\4_2023-03-01.md'


2025-11-14 16:55:43,921 - INFO - Finished converting document 4_2023-03-03 in 0.05 sec.
2025-11-14 16:55:43,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:43,981 - INFO - Going to convert document batch...
2025-11-14 16:55:43,981 - INFO - Processing document 4_2023-03-09
2025-11-14 16:55:44,021 - INFO - Finished converting document 4_2023-03-09 in 0.06 sec.
2025-11-14 16:55:44,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:44,132 - INFO - Going to convert document batch...
2025-11-14 16:55:44,133 - INFO - Processing document 4_2023-04-04


Converted 'data\edgar_documents\KO\4_2023-03-03' --> 'data\processed_data\KO\4_2023-03-03.md'
Converted 'data\edgar_documents\KO\4_2023-03-09' --> 'data\processed_data\KO\4_2023-03-09.md'


2025-11-14 16:55:44,174 - INFO - Finished converting document 4_2023-04-04 in 0.11 sec.
2025-11-14 16:55:44,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:44,334 - INFO - Going to convert document batch...
2025-11-14 16:55:44,337 - INFO - Processing document 4_2023-05-02
2025-11-14 16:55:44,371 - INFO - Finished converting document 4_2023-05-02 in 0.16 sec.


Converted 'data\edgar_documents\KO\4_2023-04-04' --> 'data\processed_data\KO\4_2023-04-04.md'


2025-11-14 16:55:44,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:44,463 - INFO - Going to convert document batch...
2025-11-14 16:55:44,464 - INFO - Processing document 4_2023-05-03
2025-11-14 16:55:44,508 - INFO - Finished converting document 4_2023-05-03 in 0.09 sec.
2025-11-14 16:55:44,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2023-05-02' --> 'data\processed_data\KO\4_2023-05-02.md'
Converted 'data\edgar_documents\KO\4_2023-05-03' --> 'data\processed_data\KO\4_2023-05-03.md'


2025-11-14 16:55:44,618 - INFO - Going to convert document batch...
2025-11-14 16:55:44,619 - INFO - Processing document 4_2023-05-08
2025-11-14 16:55:44,656 - INFO - Finished converting document 4_2023-05-08 in 0.11 sec.
2025-11-14 16:55:44,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:44,763 - INFO - Going to convert document batch...
2025-11-14 16:55:44,764 - INFO - Processing document 4_2023-05-15
2025-11-14 16:55:44,798 - INFO - Finished converting document 4_2023-05-15 in 0.09 sec.
2025-11-14 16:55:44,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2023-05-08' --> 'data\processed_data\KO\4_2023-05-08.md'
Converted 'data\edgar_documents\KO\4_2023-05-15' --> 'data\processed_data\KO\4_2023-05-15.md'


2025-11-14 16:55:44,899 - INFO - Going to convert document batch...
2025-11-14 16:55:44,900 - INFO - Processing document 4_2023-05-16
2025-11-14 16:55:45,031 - INFO - Finished converting document 4_2023-05-16 in 0.19 sec.
2025-11-14 16:55:45,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,090 - INFO - Going to convert document batch...
2025-11-14 16:55:45,091 - INFO - Processing document 4_2023-06-12
2025-11-14 16:55:45,119 - INFO - Finished converting document 4_2023-06-12 in 0.05 sec.
2025-11-14 16:55:45,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,170 - INFO - Going to convert document batch...
2025-11-14 16:55:45,171 - INFO - Processing document 4_2023-07-05
2025-11-14 16:55:45,195 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 16:55:45,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2023-05-16' --> 'data\processed_data\KO\4_2023-05-16.md'
Converted 'data\edgar_documents\KO\4_2023-06-12' --> 'data\processed_data\KO\4_2023-06-12.md'
Converted 'data\edgar_documents\KO\4_2023-07-05' --> 'data\processed_data\KO\4_2023-07-05.md'


2025-11-14 16:55:45,261 - INFO - Going to convert document batch...
2025-11-14 16:55:45,262 - INFO - Processing document 4_2023-07-21
2025-11-14 16:55:45,305 - INFO - Finished converting document 4_2023-07-21 in 0.06 sec.
2025-11-14 16:55:45,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,403 - INFO - Going to convert document batch...
2025-11-14 16:55:45,404 - INFO - Processing document 4_2023-07-28
2025-11-14 16:55:45,432 - INFO - Finished converting document 4_2023-07-28 in 0.09 sec.
2025-11-14 16:55:45,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,496 - INFO - Going to convert document batch...
2025-11-14 16:55:45,497 - INFO - Processing document 4_2023-08-04
2025-11-14 16:55:45,536 - INFO - Finished converting document 4_2023-08-04 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2023-07-21' --> 'data\processed_data\KO\4_2023-07-21.md'
Converted 'data\edgar_documents\KO\4_2023-07-28' --> 'data\processed_data\KO\4_2023-07-28.md'


2025-11-14 16:55:45,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,611 - INFO - Going to convert document batch...
2025-11-14 16:55:45,612 - INFO - Processing document 4_2023-08-14
2025-11-14 16:55:45,645 - INFO - Finished converting document 4_2023-08-14 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2023-08-04' --> 'data\processed_data\KO\4_2023-08-04.md'
Converted 'data\edgar_documents\KO\4_2023-08-14' --> 'data\processed_data\KO\4_2023-08-14.md'


2025-11-14 16:55:45,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,824 - INFO - Going to convert document batch...
2025-11-14 16:55:45,825 - INFO - Processing document 4_2023-09-20
2025-11-14 16:55:45,864 - INFO - Finished converting document 4_2023-09-20 in 0.11 sec.
2025-11-14 16:55:45,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:45,939 - INFO - Going to convert document batch...
2025-11-14 16:55:45,940 - INFO - Processing document 4_2023-10-19
2025-11-14 16:55:45,961 - INFO - Finished converting document 4_2023-10-19 in 0.05 sec.
2025-11-14 16:55:45,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,007 - INFO - Going to convert document batch...
2025-11-14 16:55:46,007 - INFO - Processing document 4_2023-10-30
2025-11-14 16:55:46,041 - INFO - Finished converting document 4_2023-10-30 in 0.05 sec.
2025-11-14 16:55:46,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\KO\4_2023-09-20' --> 'data\processed_data\KO\4_2023-09-20.md'
Converted 'data\edgar_documents\KO\4_2023-10-19' --> 'data\processed_data\KO\4_2023-10-19.md'
Converted 'data\edgar_documents\KO\4_2023-10-30' --> 'data\processed_data\KO\4_2023-10-30.md'


2025-11-14 16:55:46,097 - INFO - Processing document 4_2023-11-20
2025-11-14 16:55:46,132 - INFO - Finished converting document 4_2023-11-20 in 0.06 sec.
2025-11-14 16:55:46,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,230 - INFO - Going to convert document batch...
2025-11-14 16:55:46,231 - INFO - Processing document 4_2023-12-13
2025-11-14 16:55:46,261 - INFO - Finished converting document 4_2023-12-13 in 0.09 sec.
2025-11-14 16:55:46,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,342 - INFO - Going to convert document batch...
2025-11-14 16:55:46,343 - INFO - Processing document 4_2023-12-20


Converted 'data\edgar_documents\KO\4_2023-11-20' --> 'data\processed_data\KO\4_2023-11-20.md'
Converted 'data\edgar_documents\KO\4_2023-12-13' --> 'data\processed_data\KO\4_2023-12-13.md'


2025-11-14 16:55:46,375 - INFO - Finished converting document 4_2023-12-20 in 0.08 sec.
2025-11-14 16:55:46,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,439 - INFO - Going to convert document batch...
2025-11-14 16:55:46,440 - INFO - Processing document 4_2023-12-21
2025-11-14 16:55:46,564 - INFO - Finished converting document 4_2023-12-21 in 0.16 sec.


Converted 'data\edgar_documents\KO\4_2023-12-20' --> 'data\processed_data\KO\4_2023-12-20.md'
Converted 'data\edgar_documents\KO\4_2023-12-21' --> 'data\processed_data\KO\4_2023-12-21.md'


2025-11-14 16:55:46,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,665 - INFO - Going to convert document batch...
2025-11-14 16:55:46,666 - INFO - Processing document 4_2024-02-01
2025-11-14 16:55:46,699 - INFO - Finished converting document 4_2024-02-01 in 0.11 sec.
2025-11-14 16:55:46,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,794 - INFO - Going to convert document batch...
2025-11-14 16:55:46,794 - INFO - Processing document 4_2024-02-14
2025-11-14 16:55:46,818 - INFO - Finished converting document 4_2024-02-14 in 0.08 sec.
2025-11-14 16:55:46,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,865 - INFO - Going to convert document batch...
2025-11-14 16:55:46,866 - INFO - Processing document 4_2024-02-20
2025-11-14 16:55:46,895 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.


Converted 'data\edgar_documents\KO\4_2024-02-01' --> 'data\processed_data\KO\4_2024-02-01.md'
Converted 'data\edgar_documents\KO\4_2024-02-14' --> 'data\processed_data\KO\4_2024-02-14.md'


2025-11-14 16:55:46,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:46,945 - INFO - Going to convert document batch...
2025-11-14 16:55:46,945 - INFO - Processing document 4_2024-02-26
2025-11-14 16:55:47,052 - INFO - Finished converting document 4_2024-02-26 in 0.12 sec.


Converted 'data\edgar_documents\KO\4_2024-02-20' --> 'data\processed_data\KO\4_2024-02-20.md'
Converted 'data\edgar_documents\KO\4_2024-02-26' --> 'data\processed_data\KO\4_2024-02-26.md'


2025-11-14 16:55:47,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:47,171 - INFO - Going to convert document batch...
2025-11-14 16:55:47,172 - INFO - Processing document 4_2024-02-28
2025-11-14 16:55:47,204 - INFO - Finished converting document 4_2024-02-28 in 0.12 sec.
2025-11-14 16:55:47,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:47,259 - INFO - Going to convert document batch...
2025-11-14 16:55:47,259 - INFO - Processing document 4_2024-03-01
2025-11-14 16:55:47,282 - INFO - Finished converting document 4_2024-03-01 in 0.05 sec.
2025-11-14 16:55:47,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:47,330 - INFO - Going to convert document batch...
2025-11-14 16:55:47,331 - INFO - Processing document 4_2024-03-06
2025-11-14 16:55:47,352 - INFO - Finished converting document 4_2024-03-06 in 0.03 sec.
2025-11-14 16:55:47,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\KO\4_2024-02-28' --> 'data\processed_data\KO\4_2024-02-28.md'
Converted 'data\edgar_documents\KO\4_2024-03-01' --> 'data\processed_data\KO\4_2024-03-01.md'
Converted 'data\edgar_documents\KO\4_2024-03-06' --> 'data\processed_data\KO\4_2024-03-06.md'


2025-11-14 16:55:47,448 - INFO - Finished converting document 4_2024-03-12 in 0.08 sec.
2025-11-14 16:55:47,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:47,560 - INFO - Going to convert document batch...
2025-11-14 16:55:47,561 - INFO - Processing document 4_2024-03-15
2025-11-14 16:55:47,597 - INFO - Finished converting document 4_2024-03-15 in 0.11 sec.
2025-11-14 16:55:47,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2024-03-12' --> 'data\processed_data\KO\4_2024-03-12.md'
Converted 'data\edgar_documents\KO\4_2024-03-15' --> 'data\processed_data\KO\4_2024-03-15.md'


2025-11-14 16:55:47,702 - INFO - Going to convert document batch...
2025-11-14 16:55:47,703 - INFO - Processing document 4_2024-04-03
2025-11-14 16:55:47,739 - INFO - Finished converting document 4_2024-04-03 in 0.11 sec.
2025-11-14 16:55:47,797 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:55:47,798 - ERROR - Input document 4_2024-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:55:47,799 - INFO - Going to convert document batch...
2025-11-14 16:55:47,813 - IN

Converted 'data\edgar_documents\KO\4_2024-04-03' --> 'data\processed_data\KO\4_2024-04-03.md'
Error processing data\edgar_documents\KO\4_2024-05-06: File format not allowed: data\edgar_documents\KO\4_2024-05-06


2025-11-14 16:55:48,032 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:55:48,033 - ERROR - Input document 4_2024-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:55:48,035 - INFO - Going to convert document batch...
2025-11-14 16:55:48,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:48,061 - INFO - Going to convert document batch...
2025-11-14 16:55:48,062 - INFO - Processing document 4_2024-05-09
2025-11-14 16:55:48,100 - INFO - Fin

Converted 'data\edgar_documents\KO\4_2024-05-07' --> 'data\processed_data\KO\4_2024-05-07.md'
Error processing data\edgar_documents\KO\4_2024-05-08: File format not allowed: data\edgar_documents\KO\4_2024-05-08
Converted 'data\edgar_documents\KO\4_2024-05-09' --> 'data\processed_data\KO\4_2024-05-09.md'


2025-11-14 16:55:48,193 - INFO - Finished converting document 4_2024-05-10 in 0.06 sec.
2025-11-14 16:55:48,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:48,259 - INFO - Going to convert document batch...
2025-11-14 16:55:48,260 - INFO - Processing document 4_2024-05-14
2025-11-14 16:55:48,366 - INFO - Finished converting document 4_2024-05-14 in 0.14 sec.


Converted 'data\edgar_documents\KO\4_2024-05-10' --> 'data\processed_data\KO\4_2024-05-10.md'


2025-11-14 16:55:48,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:48,450 - INFO - Going to convert document batch...
2025-11-14 16:55:48,451 - INFO - Processing document 4_2024-05-16
2025-11-14 16:55:48,481 - INFO - Finished converting document 4_2024-05-16 in 0.06 sec.
2025-11-14 16:55:48,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:48,547 - INFO - Going to convert document batch...
2025-11-14 16:55:48,549 - INFO - Processing document 4_2024-06-13


Converted 'data\edgar_documents\KO\4_2024-05-14' --> 'data\processed_data\KO\4_2024-05-14.md'
Converted 'data\edgar_documents\KO\4_2024-05-16' --> 'data\processed_data\KO\4_2024-05-16.md'


2025-11-14 16:55:49,053 - INFO - Finished converting document 4_2024-06-13 in 0.53 sec.
2025-11-14 16:55:49,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,137 - INFO - Going to convert document batch...
2025-11-14 16:55:49,138 - INFO - Processing document 4_2024-06-18
2025-11-14 16:55:49,167 - INFO - Finished converting document 4_2024-06-18 in 0.09 sec.
2025-11-14 16:55:49,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,227 - INFO - Going to convert document batch...
2025-11-14 16:55:49,227 - INFO - Processing document 4_2024-07-05
2025-11-14 16:55:49,246 - INFO - Finished converting document 4_2024-07-05 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2024-06-13' --> 'data\processed_data\KO\4_2024-06-13.md'
Converted 'data\edgar_documents\KO\4_2024-06-18' --> 'data\processed_data\KO\4_2024-06-18.md'


2025-11-14 16:55:49,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,295 - INFO - Going to convert document batch...
2025-11-14 16:55:49,296 - INFO - Processing document 4_2024-07-19
2025-11-14 16:55:49,426 - INFO - Finished converting document 4_2024-07-19 in 0.16 sec.


Converted 'data\edgar_documents\KO\4_2024-07-05' --> 'data\processed_data\KO\4_2024-07-05.md'


2025-11-14 16:55:49,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,481 - INFO - Going to convert document batch...
2025-11-14 16:55:49,482 - INFO - Processing document 4_2024-07-30
2025-11-14 16:55:49,524 - INFO - Finished converting document 4_2024-07-30 in 0.06 sec.
2025-11-14 16:55:49,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,602 - INFO - Going to convert document batch...
2025-11-14 16:55:49,603 - INFO - Processing document 4_2024-08-05
2025-11-14 16:55:49,627 - INFO - Finished converting document 4_2024-08-05 in 0.08 sec.


Converted 'data\edgar_documents\KO\4_2024-07-19' --> 'data\processed_data\KO\4_2024-07-19.md'
Converted 'data\edgar_documents\KO\4_2024-07-30' --> 'data\processed_data\KO\4_2024-07-30.md'


2025-11-14 16:55:49,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,682 - INFO - Going to convert document batch...
2025-11-14 16:55:49,684 - INFO - Processing document 4_2024-08-06
2025-11-14 16:55:49,720 - INFO - Finished converting document 4_2024-08-06 in 0.08 sec.
2025-11-14 16:55:49,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:49,814 - INFO - Going to convert document batch...
2025-11-14 16:55:49,814 - INFO - Processing document 4_2024-08-07


Converted 'data\edgar_documents\KO\4_2024-08-05' --> 'data\processed_data\KO\4_2024-08-05.md'
Converted 'data\edgar_documents\KO\4_2024-08-06' --> 'data\processed_data\KO\4_2024-08-06.md'


2025-11-14 16:55:49,849 - INFO - Finished converting document 4_2024-08-07 in 0.09 sec.
2025-11-14 16:55:49,901 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:55:49,902 - ERROR - Input document 4_2024-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:55:49,904 - INFO - Going to convert document batch...
2025-11-14 16:55:49,924 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:55:49,926 - ERROR - Input document 4_2024-08-09 with forma

Converted 'data\edgar_documents\KO\4_2024-08-07' --> 'data\processed_data\KO\4_2024-08-07.md'
Error processing data\edgar_documents\KO\4_2024-08-08: File format not allowed: data\edgar_documents\KO\4_2024-08-08
Error processing data\edgar_documents\KO\4_2024-08-09: File format not allowed: data\edgar_documents\KO\4_2024-08-09


2025-11-14 16:55:50,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,134 - INFO - Going to convert document batch...
2025-11-14 16:55:50,135 - INFO - Processing document 4_2024-08-23
2025-11-14 16:55:50,190 - INFO - Finished converting document 4_2024-08-23 in 0.09 sec.
2025-11-14 16:55:50,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2024-08-22' --> 'data\processed_data\KO\4_2024-08-22.md'
Converted 'data\edgar_documents\KO\4_2024-08-23' --> 'data\processed_data\KO\4_2024-08-23.md'


2025-11-14 16:55:50,321 - INFO - Going to convert document batch...
2025-11-14 16:55:50,322 - INFO - Processing document 4_2024-08-27
2025-11-14 16:55:50,461 - INFO - Finished converting document 4_2024-08-27 in 0.22 sec.
2025-11-14 16:55:50,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,531 - INFO - Going to convert document batch...
2025-11-14 16:55:50,532 - INFO - Processing document 4_2024-08-29
2025-11-14 16:55:50,557 - INFO - Finished converting document 4_2024-08-29 in 0.05 sec.
2025-11-14 16:55:50,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,606 - INFO - Going to convert document batch...
2025-11-14 16:55:50,607 - INFO - Processing document 4_2024-10-21
2025-11-14 16:55:50,630 - INFO - Finished converting document 4_2024-10-21 in 0.05 sec.
2025-11-14 16:55:50,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2024-08-27' --> 'data\processed_data\KO\4_2024-08-27.md'
Converted 'data\edgar_documents\KO\4_2024-08-29' --> 'data\processed_data\KO\4_2024-08-29.md'
Converted 'data\edgar_documents\KO\4_2024-10-21' --> 'data\processed_data\KO\4_2024-10-21.md'


2025-11-14 16:55:50,697 - INFO - Going to convert document batch...
2025-11-14 16:55:50,699 - INFO - Processing document 4_2024-11-12
2025-11-14 16:55:50,729 - INFO - Finished converting document 4_2024-11-12 in 0.08 sec.
2025-11-14 16:55:50,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,781 - INFO - Going to convert document batch...
2025-11-14 16:55:50,782 - INFO - Processing document 4_2024-11-26
2025-11-14 16:55:50,809 - INFO - Finished converting document 4_2024-11-26 in 0.06 sec.
2025-11-14 16:55:50,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,855 - INFO - Going to convert document batch...
2025-11-14 16:55:50,855 - INFO - Processing document 4_2025-02-12
2025-11-14 16:55:50,877 - INFO - Finished converting document 4_2025-02-12 in 0.05 sec.
2025-11-14 16:55:50,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:50,924 - INFO - Going to convert document batch...
2025-11-14 16:55:50,925 - 

Converted 'data\edgar_documents\KO\4_2024-11-12' --> 'data\processed_data\KO\4_2024-11-12.md'
Converted 'data\edgar_documents\KO\4_2024-11-26' --> 'data\processed_data\KO\4_2024-11-26.md'
Converted 'data\edgar_documents\KO\4_2025-02-12' --> 'data\processed_data\KO\4_2025-02-12.md'


2025-11-14 16:55:50,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,004 - INFO - Going to convert document batch...
2025-11-14 16:55:51,039 - INFO - Processing document 4_2025-02-25
2025-11-14 16:55:51,123 - INFO - Finished converting document 4_2025-02-25 in 0.16 sec.


Converted 'data\edgar_documents\KO\4_2025-02-24' --> 'data\processed_data\KO\4_2025-02-24.md'


2025-11-14 16:55:51,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,215 - INFO - Going to convert document batch...
2025-11-14 16:55:51,216 - INFO - Processing document 4_2025-02-27
2025-11-14 16:55:51,242 - INFO - Finished converting document 4_2025-02-27 in 0.08 sec.
2025-11-14 16:55:51,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,292 - INFO - Going to convert document batch...
2025-11-14 16:55:51,293 - INFO - Processing document 4_2025-02-28
2025-11-14 16:55:51,319 - INFO - Finished converting document 4_2025-02-28 in 0.05 sec.


Converted 'data\edgar_documents\KO\4_2025-02-25' --> 'data\processed_data\KO\4_2025-02-25.md'
Converted 'data\edgar_documents\KO\4_2025-02-27' --> 'data\processed_data\KO\4_2025-02-27.md'
Converted 'data\edgar_documents\KO\4_2025-02-28' --> 'data\processed_data\KO\4_2025-02-28.md'


2025-11-14 16:55:51,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,432 - INFO - Going to convert document batch...
2025-11-14 16:55:51,433 - INFO - Processing document 4_2025-03-03
2025-11-14 16:55:51,464 - INFO - Finished converting document 4_2025-03-03 in 0.12 sec.
2025-11-14 16:55:51,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,575 - INFO - Going to convert document batch...
2025-11-14 16:55:51,576 - INFO - Processing document 4_2025-03-11
2025-11-14 16:55:51,615 - INFO - Finished converting document 4_2025-03-11 in 0.09 sec.
2025-11-14 16:55:51,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,684 - INFO - Going to convert document batch...
2025-11-14 16:55:51,684 - INFO - Processing document 4_2025-03-13
2025-11-14 16:55:51,710 - INFO - Finished converting document 4_2025-03-13 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2025-03-03' --> 'data\processed_data\KO\4_2025-03-03.md'
Converted 'data\edgar_documents\KO\4_2025-03-11' --> 'data\processed_data\KO\4_2025-03-11.md'


2025-11-14 16:55:51,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,762 - INFO - Going to convert document batch...
2025-11-14 16:55:51,763 - INFO - Processing document 4_2025-04-03
2025-11-14 16:55:51,795 - INFO - Finished converting document 4_2025-04-03 in 0.06 sec.
2025-11-14 16:55:51,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,874 - INFO - Going to convert document batch...
2025-11-14 16:55:51,875 - INFO - Processing document 4_2025-05-08
2025-11-14 16:55:51,903 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.


Converted 'data\edgar_documents\KO\4_2025-03-13' --> 'data\processed_data\KO\4_2025-03-13.md'
Converted 'data\edgar_documents\KO\4_2025-04-03' --> 'data\processed_data\KO\4_2025-04-03.md'


2025-11-14 16:55:51,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:51,959 - INFO - Going to convert document batch...
2025-11-14 16:55:51,960 - INFO - Processing document 4_2025-05-09
2025-11-14 16:55:51,994 - INFO - Finished converting document 4_2025-05-09 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2025-05-08' --> 'data\processed_data\KO\4_2025-05-08.md'


2025-11-14 16:55:52,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,154 - INFO - Going to convert document batch...
2025-11-14 16:55:52,155 - INFO - Processing document 4_2025-05-12
2025-11-14 16:55:52,192 - INFO - Finished converting document 4_2025-05-12 in 0.06 sec.
2025-11-14 16:55:52,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,282 - INFO - Going to convert document batch...
2025-11-14 16:55:52,284 - INFO - Processing document 4_2025-06-03
2025-11-14 16:55:52,328 - INFO - Finished converting document 4_2025-06-03 in 0.09 sec.


Converted 'data\edgar_documents\KO\4_2025-05-09' --> 'data\processed_data\KO\4_2025-05-09.md'
Converted 'data\edgar_documents\KO\4_2025-05-12' --> 'data\processed_data\KO\4_2025-05-12.md'


2025-11-14 16:55:52,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,426 - INFO - Going to convert document batch...
2025-11-14 16:55:52,427 - INFO - Processing document 4_2025-08-05
2025-11-14 16:55:52,458 - INFO - Finished converting document 4_2025-08-05 in 0.09 sec.
2025-11-14 16:55:52,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,525 - INFO - Going to convert document batch...
2025-11-14 16:55:52,526 - INFO - Processing document 4_2025-08-07
2025-11-14 16:55:52,547 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.


Converted 'data\edgar_documents\KO\4_2025-06-03' --> 'data\processed_data\KO\4_2025-06-03.md'
Converted 'data\edgar_documents\KO\4_2025-08-05' --> 'data\processed_data\KO\4_2025-08-05.md'


2025-11-14 16:55:52,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,597 - INFO - Going to convert document batch...
2025-11-14 16:55:52,598 - INFO - Processing document 4_2025-10-20
2025-11-14 16:55:52,636 - INFO - Finished converting document 4_2025-10-20 in 0.08 sec.
2025-11-14 16:55:52,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,701 - INFO - Going to convert document batch...
2025-11-14 16:55:52,702 - INFO - Processing document 4_2025-10-27
2025-11-14 16:55:52,726 - INFO - Finished converting document 4_2025-10-27 in 0.05 sec.


Converted 'data\edgar_documents\KO\4_2025-08-07' --> 'data\processed_data\KO\4_2025-08-07.md'
Converted 'data\edgar_documents\KO\4_2025-10-20' --> 'data\processed_data\KO\4_2025-10-20.md'
Converted 'data\edgar_documents\KO\4_2025-10-27' --> 'data\processed_data\KO\4_2025-10-27.md'


2025-11-14 16:55:52,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,786 - INFO - Going to convert document batch...
2025-11-14 16:55:52,787 - INFO - Processing document 4_2025-10-28
2025-11-14 16:55:52,830 - INFO - Finished converting document 4_2025-10-28 in 0.08 sec.
2025-11-14 16:55:52,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:52,937 - INFO - Going to convert document batch...
2025-11-14 16:55:52,938 - INFO - Processing document 4_2025-10-31
2025-11-14 16:55:52,963 - INFO - Finished converting document 4_2025-10-31 in 0.11 sec.
2025-11-14 16:55:53,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,027 - INFO - Going to convert document batch...
2025-11-14 16:55:53,028 - INFO - Processing document 4_2025-11-10


Converted 'data\edgar_documents\KO\4_2025-10-28' --> 'data\processed_data\KO\4_2025-10-28.md'
Converted 'data\edgar_documents\KO\4_2025-10-31' --> 'data\processed_data\KO\4_2025-10-31.md'


2025-11-14 16:55:53,054 - INFO - Finished converting document 4_2025-11-10 in 0.06 sec.
2025-11-14 16:55:53,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,123 - INFO - Going to convert document batch...
2025-11-14 16:55:53,124 - INFO - Processing document 8-K_2023-02-14
2025-11-14 16:55:53,156 - INFO - Finished converting document 8-K_2023-02-14 in 0.08 sec.
2025-11-14 16:55:53,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,210 - INFO - Going to convert document batch...
2025-11-14 16:55:53,211 - INFO - Processing document 8-K_2023-04-24
2025-11-14 16:55:53,239 - INFO - Finished converting document 8-K_2023-04-24 in 0.06 sec.
2025-11-14 16:55:53,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\4_2025-11-10' --> 'data\processed_data\KO\4_2025-11-10.md'
Converted 'data\edgar_documents\KO\8-K_2023-02-14' --> 'data\processed_data\KO\8-K_2023-02-14.md'
Converted 'data\edgar_documents\KO\8-K_2023-04-24' --> 'data\processed_data\KO\8-K_2023-04-24.md'


2025-11-14 16:55:53,308 - INFO - Going to convert document batch...
2025-11-14 16:55:53,309 - INFO - Processing document 8-K_2023-04-26
2025-11-14 16:55:53,388 - INFO - Finished converting document 8-K_2023-04-26 in 0.14 sec.
2025-11-14 16:55:53,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,526 - INFO - Going to convert document batch...
2025-11-14 16:55:53,527 - INFO - Processing document 8-K_2023-07-19
2025-11-14 16:55:53,565 - INFO - Finished converting document 8-K_2023-07-19 in 0.14 sec.


Converted 'data\edgar_documents\KO\8-K_2023-04-26' --> 'data\processed_data\KO\8-K_2023-04-26.md'
Converted 'data\edgar_documents\KO\8-K_2023-07-19' --> 'data\processed_data\KO\8-K_2023-07-19.md'


2025-11-14 16:55:53,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,662 - INFO - Going to convert document batch...
2025-11-14 16:55:53,663 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:55:53,697 - INFO - Finished converting document 8-K_2023-07-26 in 0.11 sec.
2025-11-14 16:55:53,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,754 - INFO - Going to convert document batch...
2025-11-14 16:55:53,755 - INFO - Processing document 8-K_2023-10-20
2025-11-14 16:55:53,786 - INFO - Finished converting document 8-K_2023-10-20 in 0.08 sec.
2025-11-14 16:55:53,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:53,829 - INFO - Going to convert document batch...
2025-11-14 16:55:53,829 - INFO - Processing document 8-K_2023-10-24
2025-11-14 16:55:53,858 - INFO - Finished converting document 8-K_2023-10-24 in 0.06 sec.
2025-11-14 16:55:53,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2023-07-26' --> 'data\processed_data\KO\8-K_2023-07-26.md'
Converted 'data\edgar_documents\KO\8-K_2023-10-20' --> 'data\processed_data\KO\8-K_2023-10-20.md'
Converted 'data\edgar_documents\KO\8-K_2023-10-24' --> 'data\processed_data\KO\8-K_2023-10-24.md'


2025-11-14 16:55:53,905 - INFO - Going to convert document batch...
2025-11-14 16:55:53,906 - INFO - Processing document 8-K_2024-02-13
2025-11-14 16:55:53,955 - INFO - Finished converting document 8-K_2024-02-13 in 0.08 sec.
2025-11-14 16:55:54,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:54,021 - INFO - Going to convert document batch...
2025-11-14 16:55:54,022 - INFO - Processing document 8-K_2024-04-30


Converted 'data\edgar_documents\KO\8-K_2024-02-13' --> 'data\processed_data\KO\8-K_2024-02-13.md'


2025-11-14 16:55:54,275 - INFO - Finished converting document 8-K_2024-04-30 in 0.28 sec.
2025-11-14 16:55:54,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:54,484 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\KO\8-K_2024-04-30' --> 'data\processed_data\KO\8-K_2024-04-30.md'


2025-11-14 16:55:54,485 - INFO - Processing document 8-K_2024-05-02
2025-11-14 16:55:54,674 - INFO - Finished converting document 8-K_2024-05-02 in 0.38 sec.
2025-11-14 16:55:54,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:54,841 - INFO - Going to convert document batch...
2025-11-14 16:55:54,842 - INFO - Processing document 8-K_2024-05-08
2025-11-14 16:55:54,923 - INFO - Finished converting document 8-K_2024-05-08 in 0.17 sec.


Converted 'data\edgar_documents\KO\8-K_2024-05-02' --> 'data\processed_data\KO\8-K_2024-05-02.md'


2025-11-14 16:55:55,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:55,053 - INFO - Going to convert document batch...
2025-11-14 16:55:55,055 - INFO - Processing document 8-K_2024-05-13


Converted 'data\edgar_documents\KO\8-K_2024-05-08' --> 'data\processed_data\KO\8-K_2024-05-08.md'


2025-11-14 16:55:55,157 - INFO - Finished converting document 8-K_2024-05-13 in 0.20 sec.
2025-11-14 16:55:55,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:55,307 - INFO - Going to convert document batch...
2025-11-14 16:55:55,308 - INFO - Processing document 8-K_2024-05-14
2025-11-14 16:55:55,359 - INFO - Finished converting document 8-K_2024-05-14 in 0.17 sec.


Converted 'data\edgar_documents\KO\8-K_2024-05-13' --> 'data\processed_data\KO\8-K_2024-05-13.md'
Converted 'data\edgar_documents\KO\8-K_2024-05-14' --> 'data\processed_data\KO\8-K_2024-05-14.md'


2025-11-14 16:55:55,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:55,454 - INFO - Going to convert document batch...
2025-11-14 16:55:55,456 - INFO - Processing document 8-K_2024-07-23
2025-11-14 16:55:55,572 - INFO - Finished converting document 8-K_2024-07-23 in 0.17 sec.
2025-11-14 16:55:55,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:55,669 - INFO - Going to convert document batch...
2025-11-14 16:55:55,671 - INFO - Processing document 8-K_2024-08-09
2025-11-14 16:55:55,720 - INFO - Finished converting document 8-K_2024-08-09 in 0.12 sec.


Converted 'data\edgar_documents\KO\8-K_2024-07-23' --> 'data\processed_data\KO\8-K_2024-07-23.md'
Converted 'data\edgar_documents\KO\8-K_2024-08-09' --> 'data\processed_data\KO\8-K_2024-08-09.md'


2025-11-14 16:55:55,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:55,870 - INFO - Going to convert document batch...
2025-11-14 16:55:55,871 - INFO - Processing document 8-K_2024-08-14
2025-11-14 16:55:55,937 - INFO - Finished converting document 8-K_2024-08-14 in 0.17 sec.
2025-11-14 16:55:56,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:56,115 - INFO - Going to convert document batch...
2025-11-14 16:55:56,116 - INFO - Processing document 8-K_2024-08-15
2025-11-14 16:55:56,163 - INFO - Finished converting document 8-K_2024-08-15 in 0.11 sec.
2025-11-14 16:55:56,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2024-08-14' --> 'data\processed_data\KO\8-K_2024-08-14.md'
Converted 'data\edgar_documents\KO\8-K_2024-08-15' --> 'data\processed_data\KO\8-K_2024-08-15.md'


2025-11-14 16:55:56,265 - INFO - Going to convert document batch...
2025-11-14 16:55:56,266 - INFO - Processing document 8-K_2024-08-21
2025-11-14 16:55:56,306 - INFO - Finished converting document 8-K_2024-08-21 in 0.08 sec.
2025-11-14 16:55:56,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:56,358 - INFO - Going to convert document batch...
2025-11-14 16:55:56,358 - INFO - Processing document 8-K_2024-10-17
2025-11-14 16:55:56,392 - INFO - Finished converting document 8-K_2024-10-17 in 0.06 sec.
2025-11-14 16:55:56,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:56,444 - INFO - Going to convert document batch...
2025-11-14 16:55:56,445 - INFO - Processing document 8-K_2024-10-23
2025-11-14 16:55:56,479 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.
2025-11-14 16:55:56,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2024-08-21' --> 'data\processed_data\KO\8-K_2024-08-21.md'
Converted 'data\edgar_documents\KO\8-K_2024-10-17' --> 'data\processed_data\KO\8-K_2024-10-17.md'
Converted 'data\edgar_documents\KO\8-K_2024-10-23' --> 'data\processed_data\KO\8-K_2024-10-23.md'


2025-11-14 16:55:56,548 - INFO - Going to convert document batch...
2025-11-14 16:55:56,549 - INFO - Processing document 8-K_2024-12-11
2025-11-14 16:55:56,618 - INFO - Finished converting document 8-K_2024-12-11 in 0.11 sec.
2025-11-14 16:55:56,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:56,792 - INFO - Going to convert document batch...
2025-11-14 16:55:56,793 - INFO - Processing document 8-K_2024-12-16
2025-11-14 16:55:56,849 - INFO - Finished converting document 8-K_2024-12-16 in 0.12 sec.
2025-11-14 16:55:56,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2024-12-11' --> 'data\processed_data\KO\8-K_2024-12-11.md'
Converted 'data\edgar_documents\KO\8-K_2024-12-16' --> 'data\processed_data\KO\8-K_2024-12-16.md'


2025-11-14 16:55:56,913 - INFO - Going to convert document batch...
2025-11-14 16:55:56,915 - INFO - Processing document 8-K_2025-02-11
2025-11-14 16:55:56,950 - INFO - Finished converting document 8-K_2025-02-11 in 0.08 sec.
2025-11-14 16:55:56,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:57,013 - INFO - Going to convert document batch...
2025-11-14 16:55:57,014 - INFO - Processing document 8-K_2025-03-27
2025-11-14 16:55:57,043 - INFO - Finished converting document 8-K_2025-03-27 in 0.08 sec.
2025-11-14 16:55:57,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:57,090 - INFO - Going to convert document batch...
2025-11-14 16:55:57,091 - INFO - Processing document 8-K_2025-04-29
2025-11-14 16:55:57,122 - INFO - Finished converting document 8-K_2025-04-29 in 0.06 sec.
2025-11-14 16:55:57,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2025-02-11' --> 'data\processed_data\KO\8-K_2025-02-11.md'
Converted 'data\edgar_documents\KO\8-K_2025-03-27' --> 'data\processed_data\KO\8-K_2025-03-27.md'
Converted 'data\edgar_documents\KO\8-K_2025-04-29' --> 'data\processed_data\KO\8-K_2025-04-29.md'


2025-11-14 16:55:57,187 - INFO - Going to convert document batch...
2025-11-14 16:55:57,188 - INFO - Processing document 8-K_2025-05-02
2025-11-14 16:55:57,272 - INFO - Finished converting document 8-K_2025-05-02 in 0.12 sec.
2025-11-14 16:55:57,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2025-05-02' --> 'data\processed_data\KO\8-K_2025-05-02.md'


2025-11-14 16:55:57,700 - INFO - Going to convert document batch...
2025-11-14 16:55:57,701 - INFO - Processing document 8-K_2025-06-26
2025-11-14 16:55:57,851 - INFO - Finished converting document 8-K_2025-06-26 in 0.49 sec.
2025-11-14 16:55:57,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:57,959 - INFO - Going to convert document batch...
2025-11-14 16:55:57,960 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:55:57,991 - INFO - Finished converting document 8-K_2025-07-22 in 0.11 sec.
2025-11-14 16:55:58,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:58,056 - INFO - Going to convert document batch...
2025-11-14 16:55:58,057 - INFO - Processing document 8-K_2025-10-16


Converted 'data\edgar_documents\KO\8-K_2025-06-26' --> 'data\processed_data\KO\8-K_2025-06-26.md'
Converted 'data\edgar_documents\KO\8-K_2025-07-22' --> 'data\processed_data\KO\8-K_2025-07-22.md'


2025-11-14 16:55:58,089 - INFO - Finished converting document 8-K_2025-10-16 in 0.09 sec.
2025-11-14 16:55:58,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:55:58,149 - INFO - Going to convert document batch...
2025-11-14 16:55:58,150 - INFO - Processing document 8-K_2025-10-21
2025-11-14 16:55:58,178 - INFO - Finished converting document 8-K_2025-10-21 in 0.06 sec.
2025-11-14 16:55:58,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\8-K_2025-10-16' --> 'data\processed_data\KO\8-K_2025-10-16.md'
Converted 'data\edgar_documents\KO\8-K_2025-10-21' --> 'data\processed_data\KO\8-K_2025-10-21.md'


2025-11-14 16:55:59,954 - INFO - Going to convert document batch...
2025-11-14 16:55:59,955 - INFO - Processing document DEF-14A_2023-03-10
2025-11-14 16:56:24,647 - INFO - Finished converting document DEF-14A_2023-03-10 in 26.44 sec.


Converted 'data\edgar_documents\KO\DEF-14A_2023-03-10' --> 'data\processed_data\KO\DEF-14A_2023-03-10.md'


2025-11-14 16:56:27,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:56:29,534 - INFO - Going to convert document batch...
2025-11-14 16:56:29,534 - INFO - Processing document DEF-14A_2024-03-18
2025-11-14 16:56:53,962 - INFO - Finished converting document DEF-14A_2024-03-18 in 27.00 sec.
2025-11-14 16:56:56,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\DEF-14A_2024-03-18' --> 'data\processed_data\KO\DEF-14A_2024-03-18.md'


2025-11-14 16:56:59,391 - INFO - Going to convert document batch...
2025-11-14 16:56:59,394 - INFO - Processing document DEF-14A_2025-03-17
2025-11-14 16:57:12,776 - INFO - Finished converting document DEF-14A_2025-03-17 in 16.62 sec.
2025-11-14 16:57:14,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\KO\DEF-14A_2025-03-17' --> 'data\processed_data\KO\DEF-14A_2025-03-17.md'
Processed 122 new files. Errors: 4
Found 94 files to process in data\edgar_documents\LIN


2025-11-14 16:57:15,628 - INFO - Going to convert document batch...
2025-11-14 16:57:15,630 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:57:15,631 - INFO - Processing document 10-K_2023-02-28
2025-11-14 16:57:18,785 - INFO - Finished converting document 10-K_2023-02-28 in 4.30 sec.
2025-11-14 16:57:19,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-K_2023-02-28' --> 'data\processed_data\LIN\10-K_2023-02-28.md'


2025-11-14 16:57:20,978 - INFO - Going to convert document batch...
2025-11-14 16:57:20,979 - INFO - Processing document 10-K_2024-02-28
2025-11-14 16:57:23,679 - INFO - Finished converting document 10-K_2024-02-28 in 4.09 sec.
2025-11-14 16:57:24,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-K_2024-02-28' --> 'data\processed_data\LIN\10-K_2024-02-28.md'


2025-11-14 16:57:25,967 - INFO - Going to convert document batch...
2025-11-14 16:57:25,969 - INFO - Processing document 10-K_2025-02-26
2025-11-14 16:57:28,146 - INFO - Finished converting document 10-K_2025-02-26 in 3.61 sec.
2025-11-14 16:57:29,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-K_2025-02-26' --> 'data\processed_data\LIN\10-K_2025-02-26.md'


2025-11-14 16:57:29,412 - INFO - Going to convert document batch...
2025-11-14 16:57:29,413 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 16:57:30,092 - INFO - Finished converting document 10-Q_2023-04-27 in 1.12 sec.
2025-11-14 16:57:30,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2023-04-27' --> 'data\processed_data\LIN\10-Q_2023-04-27.md'


2025-11-14 16:57:31,747 - INFO - Going to convert document batch...
2025-11-14 16:57:31,748 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 16:57:32,629 - INFO - Finished converting document 10-Q_2023-07-27 in 2.14 sec.
2025-11-14 16:57:33,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2023-07-27' --> 'data\processed_data\LIN\10-Q_2023-07-27.md'


2025-11-14 16:57:33,886 - INFO - Going to convert document batch...
2025-11-14 16:57:33,887 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 16:57:34,853 - INFO - Finished converting document 10-Q_2023-10-26 in 1.66 sec.
2025-11-14 16:57:35,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2023-10-26' --> 'data\processed_data\LIN\10-Q_2023-10-26.md'


2025-11-14 16:57:36,400 - INFO - Going to convert document batch...
2025-11-14 16:57:36,401 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:57:37,229 - INFO - Finished converting document 10-Q_2024-05-02 in 1.41 sec.
2025-11-14 16:57:37,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2024-05-02' --> 'data\processed_data\LIN\10-Q_2024-05-02.md'


2025-11-14 16:57:38,571 - INFO - Going to convert document batch...
2025-11-14 16:57:38,572 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 16:57:39,558 - INFO - Finished converting document 10-Q_2024-08-02 in 1.95 sec.
2025-11-14 16:57:40,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2024-08-02' --> 'data\processed_data\LIN\10-Q_2024-08-02.md'


2025-11-14 16:57:40,620 - INFO - Going to convert document batch...
2025-11-14 16:57:40,621 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 16:57:41,457 - INFO - Finished converting document 10-Q_2024-10-31 in 1.45 sec.
2025-11-14 16:57:42,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2024-10-31' --> 'data\processed_data\LIN\10-Q_2024-10-31.md'


2025-11-14 16:57:42,917 - INFO - Going to convert document batch...
2025-11-14 16:57:42,917 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:57:43,589 - INFO - Finished converting document 10-Q_2025-05-01 in 1.67 sec.
2025-11-14 16:57:44,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2025-05-01' --> 'data\processed_data\LIN\10-Q_2025-05-01.md'


2025-11-14 16:57:44,570 - INFO - Going to convert document batch...
2025-11-14 16:57:44,571 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 16:57:45,402 - INFO - Finished converting document 10-Q_2025-08-01 in 1.44 sec.
2025-11-14 16:57:45,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\10-Q_2025-08-01' --> 'data\processed_data\LIN\10-Q_2025-08-01.md'


2025-11-14 16:57:46,867 - INFO - Going to convert document batch...
2025-11-14 16:57:46,868 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 16:57:47,902 - INFO - Finished converting document 10-Q_2025-10-31 in 2.06 sec.
2025-11-14 16:57:48,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:48,647 - INFO - Going to convert document batch...
2025-11-14 16:57:48,647 - INFO - Processing document 4_2023-01-24
2025-11-14 16:57:48,708 - INFO - Finished converting document 4_2023-01-24 in 0.14 sec.


Converted 'data\edgar_documents\LIN\10-Q_2025-10-31' --> 'data\processed_data\LIN\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\LIN\4_2023-01-24' --> 'data\processed_data\LIN\4_2023-01-24.md'


2025-11-14 16:57:48,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:48,829 - INFO - Going to convert document batch...
2025-11-14 16:57:48,830 - INFO - Processing document 4_2023-02-15
2025-11-14 16:57:48,896 - INFO - Finished converting document 4_2023-02-15 in 0.12 sec.
2025-11-14 16:57:48,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:49,005 - INFO - Going to convert document batch...
2025-11-14 16:57:49,006 - INFO - Processing document 4_2023-03-07
2025-11-14 16:57:49,062 - INFO - Finished converting document 4_2023-03-07 in 0.12 sec.
2025-11-14 16:57:49,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:49,132 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LIN\4_2023-02-15' --> 'data\processed_data\LIN\4_2023-02-15.md'
Converted 'data\edgar_documents\LIN\4_2023-03-07' --> 'data\processed_data\LIN\4_2023-03-07.md'


2025-11-14 16:57:49,133 - INFO - Processing document 4_2023-03-09
2025-11-14 16:57:49,194 - INFO - Finished converting document 4_2023-03-09 in 0.09 sec.
2025-11-14 16:57:49,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:49,295 - INFO - Going to convert document batch...
2025-11-14 16:57:49,296 - INFO - Processing document 4_2023-03-13
2025-11-14 16:57:49,365 - INFO - Finished converting document 4_2023-03-13 in 0.11 sec.


Converted 'data\edgar_documents\LIN\4_2023-03-09' --> 'data\processed_data\LIN\4_2023-03-09.md'
Converted 'data\edgar_documents\LIN\4_2023-03-13' --> 'data\processed_data\LIN\4_2023-03-13.md'


2025-11-14 16:57:49,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:49,533 - INFO - Going to convert document batch...
2025-11-14 16:57:49,533 - INFO - Processing document 4_2023-03-22
2025-11-14 16:57:49,750 - INFO - Finished converting document 4_2023-03-22 in 0.33 sec.
2025-11-14 16:57:49,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:49,898 - INFO - Going to convert document batch...
2025-11-14 16:57:49,900 - INFO - Processing document 4_2023-04-20
2025-11-14 16:57:49,931 - INFO - Finished converting document 4_2023-04-20 in 0.09 sec.
2025-11-14 16:57:49,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:50,000 - INFO - Going to convert document batch...
2025-11-14 16:57:50,001 - INFO - Processing document 4_2023-05-03


Converted 'data\edgar_documents\LIN\4_2023-03-22' --> 'data\processed_data\LIN\4_2023-03-22.md'
Converted 'data\edgar_documents\LIN\4_2023-04-20' --> 'data\processed_data\LIN\4_2023-04-20.md'


2025-11-14 16:57:50,086 - INFO - Finished converting document 4_2023-05-03 in 0.12 sec.
2025-11-14 16:57:50,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:50,230 - INFO - Going to convert document batch...
2025-11-14 16:57:50,232 - INFO - Processing document 4_2023-05-17
2025-11-14 16:57:50,288 - INFO - Finished converting document 4_2023-05-17 in 0.12 sec.


Converted 'data\edgar_documents\LIN\4_2023-05-03' --> 'data\processed_data\LIN\4_2023-05-03.md'
Converted 'data\edgar_documents\LIN\4_2023-05-17' --> 'data\processed_data\LIN\4_2023-05-17.md'


2025-11-14 16:57:50,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:50,400 - INFO - Going to convert document batch...
2025-11-14 16:57:50,402 - INFO - Processing document 4_2023-05-19
2025-11-14 16:57:50,574 - INFO - Finished converting document 4_2023-05-19 in 0.22 sec.
2025-11-14 16:57:50,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:50,655 - INFO - Going to convert document batch...
2025-11-14 16:57:50,656 - INFO - Processing document 4_2023-06-16
2025-11-14 16:57:50,710 - INFO - Finished converting document 4_2023-06-16 in 0.08 sec.
2025-11-14 16:57:50,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2023-05-19' --> 'data\processed_data\LIN\4_2023-05-19.md'
Converted 'data\edgar_documents\LIN\4_2023-06-16' --> 'data\processed_data\LIN\4_2023-06-16.md'


2025-11-14 16:57:51,306 - INFO - Going to convert document batch...
2025-11-14 16:57:51,306 - INFO - Processing document 4_2023-08-03
2025-11-14 16:57:51,379 - INFO - Finished converting document 4_2023-08-03 in 0.61 sec.
2025-11-14 16:57:51,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:51,460 - INFO - Going to convert document batch...
2025-11-14 16:57:51,461 - INFO - Processing document 4_2023-09-11
2025-11-14 16:57:51,503 - INFO - Finished converting document 4_2023-09-11 in 0.08 sec.
2025-11-14 16:57:51,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:51,588 - INFO - Going to convert document batch...
2025-11-14 16:57:51,589 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\LIN\4_2023-08-03' --> 'data\processed_data\LIN\4_2023-08-03.md'
Converted 'data\edgar_documents\LIN\4_2023-09-11' --> 'data\processed_data\LIN\4_2023-09-11.md'


2025-11-14 16:57:51,644 - INFO - Finished converting document 4_2023-09-18 in 0.11 sec.
2025-11-14 16:57:51,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:51,847 - INFO - Going to convert document batch...
2025-11-14 16:57:51,848 - INFO - Processing document 4_2024-01-23


Converted 'data\edgar_documents\LIN\4_2023-09-18' --> 'data\processed_data\LIN\4_2023-09-18.md'


2025-11-14 16:57:51,902 - INFO - Finished converting document 4_2024-01-23 in 0.22 sec.
2025-11-14 16:57:52,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:52,138 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LIN\4_2024-01-23' --> 'data\processed_data\LIN\4_2024-01-23.md'


2025-11-14 16:57:52,139 - INFO - Processing document 4_2024-02-12
2025-11-14 16:57:52,207 - INFO - Finished converting document 4_2024-02-12 in 0.25 sec.
2025-11-14 16:57:52,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:52,306 - INFO - Going to convert document batch...
2025-11-14 16:57:52,307 - INFO - Processing document 4_2024-03-06
2025-11-14 16:57:52,354 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 16:57:52,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2024-02-12' --> 'data\processed_data\LIN\4_2024-02-12.md'
Converted 'data\edgar_documents\LIN\4_2024-03-06' --> 'data\processed_data\LIN\4_2024-03-06.md'


2025-11-14 16:57:52,479 - INFO - Going to convert document batch...
2025-11-14 16:57:52,481 - INFO - Processing document 4_2024-03-07
2025-11-14 16:57:52,618 - INFO - Finished converting document 4_2024-03-07 in 0.22 sec.
2025-11-14 16:57:52,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:52,767 - INFO - Going to convert document batch...
2025-11-14 16:57:52,768 - INFO - Processing document 4_2024-03-08
2025-11-14 16:57:52,822 - INFO - Finished converting document 4_2024-03-08 in 0.16 sec.


Converted 'data\edgar_documents\LIN\4_2024-03-07' --> 'data\processed_data\LIN\4_2024-03-07.md'


2025-11-14 16:57:52,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:52,923 - INFO - Going to convert document batch...
2025-11-14 16:57:52,923 - INFO - Processing document 4_2024-03-11
2025-11-14 16:57:52,978 - INFO - Finished converting document 4_2024-03-11 in 0.11 sec.


Converted 'data\edgar_documents\LIN\4_2024-03-08' --> 'data\processed_data\LIN\4_2024-03-08.md'
Converted 'data\edgar_documents\LIN\4_2024-03-11' --> 'data\processed_data\LIN\4_2024-03-11.md'


2025-11-14 16:57:53,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:53,190 - INFO - Going to convert document batch...
2025-11-14 16:57:53,192 - INFO - Processing document 4_2024-03-13
2025-11-14 16:57:53,269 - INFO - Finished converting document 4_2024-03-13 in 0.25 sec.
2025-11-14 16:57:53,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:53,408 - INFO - Going to convert document batch...
2025-11-14 16:57:53,409 - INFO - Processing document 4_2024-03-14
2025-11-14 16:57:53,475 - INFO - Finished converting document 4_2024-03-14 in 0.14 sec.


Converted 'data\edgar_documents\LIN\4_2024-03-13' --> 'data\processed_data\LIN\4_2024-03-13.md'


2025-11-14 16:57:53,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:53,588 - INFO - Going to convert document batch...
2025-11-14 16:57:53,589 - INFO - Processing document 4_2024-03-18
2025-11-14 16:57:53,655 - INFO - Finished converting document 4_2024-03-18 in 0.14 sec.


Converted 'data\edgar_documents\LIN\4_2024-03-14' --> 'data\processed_data\LIN\4_2024-03-14.md'


2025-11-14 16:57:53,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:53,846 - INFO - Going to convert document batch...
2025-11-14 16:57:53,848 - INFO - Processing document 4_2024-05-15
2025-11-14 16:57:53,902 - INFO - Finished converting document 4_2024-05-15 in 0.19 sec.


Converted 'data\edgar_documents\LIN\4_2024-03-18' --> 'data\processed_data\LIN\4_2024-03-18.md'


2025-11-14 16:57:53,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,019 - INFO - Going to convert document batch...
2025-11-14 16:57:54,019 - INFO - Processing document 4_2024-08-20
2025-11-14 16:57:54,078 - INFO - Finished converting document 4_2024-08-20 in 0.09 sec.
2025-11-14 16:57:54,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,154 - INFO - Going to convert document batch...
2025-11-14 16:57:54,155 - INFO - Processing document 4_2024-08-23


Converted 'data\edgar_documents\LIN\4_2024-05-15' --> 'data\processed_data\LIN\4_2024-05-15.md'
Converted 'data\edgar_documents\LIN\4_2024-08-20' --> 'data\processed_data\LIN\4_2024-08-20.md'


2025-11-14 16:57:54,228 - INFO - Finished converting document 4_2024-08-23 in 0.11 sec.
2025-11-14 16:57:54,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,377 - INFO - Going to convert document batch...
2025-11-14 16:57:54,378 - INFO - Processing document 4_2024-09-11
2025-11-14 16:57:54,427 - INFO - Finished converting document 4_2024-09-11 in 0.12 sec.
2025-11-14 16:57:54,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2024-08-23' --> 'data\processed_data\LIN\4_2024-08-23.md'
Converted 'data\edgar_documents\LIN\4_2024-09-11' --> 'data\processed_data\LIN\4_2024-09-11.md'


2025-11-14 16:57:54,494 - INFO - Going to convert document batch...
2025-11-14 16:57:54,495 - INFO - Processing document 4_2024-10-02
2025-11-14 16:57:54,526 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 16:57:54,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,687 - INFO - Going to convert document batch...
2025-11-14 16:57:54,687 - INFO - Processing document 4_2024-12-06
2025-11-14 16:57:54,748 - INFO - Finished converting document 4_2024-12-06 in 0.14 sec.


Converted 'data\edgar_documents\LIN\4_2024-10-02' --> 'data\processed_data\LIN\4_2024-10-02.md'


2025-11-14 16:57:54,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,860 - INFO - Going to convert document batch...
2025-11-14 16:57:54,861 - INFO - Processing document 4_2024-12-12
2025-11-14 16:57:54,887 - INFO - Finished converting document 4_2024-12-12 in 0.09 sec.
2025-11-14 16:57:54,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:54,951 - INFO - Going to convert document batch...
2025-11-14 16:57:54,953 - INFO - Processing document 4_2024-12-17
2025-11-14 16:57:54,998 - INFO - Finished converting document 4_2024-12-17 in 0.08 sec.


Converted 'data\edgar_documents\LIN\4_2024-12-06' --> 'data\processed_data\LIN\4_2024-12-06.md'
Converted 'data\edgar_documents\LIN\4_2024-12-12' --> 'data\processed_data\LIN\4_2024-12-12.md'


2025-11-14 16:57:55,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:55,082 - INFO - Going to convert document batch...
2025-11-14 16:57:55,083 - INFO - Processing document 4_2024-12-26
2025-11-14 16:57:55,156 - INFO - Finished converting document 4_2024-12-26 in 0.12 sec.


Converted 'data\edgar_documents\LIN\4_2024-12-17' --> 'data\processed_data\LIN\4_2024-12-17.md'
Converted 'data\edgar_documents\LIN\4_2024-12-26' --> 'data\processed_data\LIN\4_2024-12-26.md'


2025-11-14 16:57:55,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:55,300 - INFO - Going to convert document batch...
2025-11-14 16:57:55,580 - INFO - Processing document 4_2025-01-21
2025-11-14 16:57:55,644 - INFO - Finished converting document 4_2025-01-21 in 0.42 sec.
2025-11-14 16:57:55,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:55,753 - INFO - Going to convert document batch...
2025-11-14 16:57:55,755 - INFO - Processing document 4_2025-02-05
2025-11-14 16:57:55,784 - INFO - Finished converting document 4_2025-02-05 in 0.09 sec.
2025-11-14 16:57:55,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:55,872 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LIN\4_2025-01-21' --> 'data\processed_data\LIN\4_2025-01-21.md'
Converted 'data\edgar_documents\LIN\4_2025-02-05' --> 'data\processed_data\LIN\4_2025-02-05.md'


2025-11-14 16:57:55,873 - INFO - Processing document 4_2025-02-12
2025-11-14 16:57:55,934 - INFO - Finished converting document 4_2025-02-12 in 0.11 sec.
2025-11-14 16:57:55,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:55,992 - INFO - Going to convert document batch...
2025-11-14 16:57:55,993 - INFO - Processing document 4_2025-02-21
2025-11-14 16:57:56,044 - INFO - Finished converting document 4_2025-02-21 in 0.09 sec.
2025-11-14 16:57:56,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2025-02-12' --> 'data\processed_data\LIN\4_2025-02-12.md'
Converted 'data\edgar_documents\LIN\4_2025-02-21' --> 'data\processed_data\LIN\4_2025-02-21.md'


2025-11-14 16:57:56,172 - INFO - Going to convert document batch...
2025-11-14 16:57:56,173 - INFO - Processing document 4_2025-02-27
2025-11-14 16:57:56,236 - INFO - Finished converting document 4_2025-02-27 in 0.16 sec.
2025-11-14 16:57:56,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:56,362 - INFO - Going to convert document batch...
2025-11-14 16:57:56,362 - INFO - Processing document 4_2025-03-04
2025-11-14 16:57:56,421 - INFO - Finished converting document 4_2025-03-04 in 0.14 sec.


Converted 'data\edgar_documents\LIN\4_2025-02-27' --> 'data\processed_data\LIN\4_2025-02-27.md'
Converted 'data\edgar_documents\LIN\4_2025-03-04' --> 'data\processed_data\LIN\4_2025-03-04.md'


2025-11-14 16:57:56,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:56,544 - INFO - Going to convert document batch...
2025-11-14 16:57:56,545 - INFO - Processing document 4_2025-03-06
2025-11-14 16:57:56,710 - INFO - Finished converting document 4_2025-03-06 in 0.23 sec.
2025-11-14 16:57:56,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:56,843 - INFO - Going to convert document batch...
2025-11-14 16:57:56,845 - INFO - Processing document 4_2025-03-11
2025-11-14 16:57:56,920 - INFO - Finished converting document 4_2025-03-11 in 0.17 sec.


Converted 'data\edgar_documents\LIN\4_2025-03-06' --> 'data\processed_data\LIN\4_2025-03-06.md'


2025-11-14 16:57:57,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:57,052 - INFO - Going to convert document batch...
2025-11-14 16:57:57,052 - INFO - Processing document 4_2025-03-12
2025-11-14 16:57:57,102 - INFO - Finished converting document 4_2025-03-12 in 0.11 sec.


Converted 'data\edgar_documents\LIN\4_2025-03-11' --> 'data\processed_data\LIN\4_2025-03-11.md'
Converted 'data\edgar_documents\LIN\4_2025-03-12' --> 'data\processed_data\LIN\4_2025-03-12.md'


2025-11-14 16:57:57,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:57,205 - INFO - Going to convert document batch...
2025-11-14 16:57:57,207 - INFO - Processing document 4_2025-04-02
2025-11-14 16:57:57,329 - INFO - Finished converting document 4_2025-04-02 in 0.17 sec.
2025-11-14 16:57:57,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:57,444 - INFO - Going to convert document batch...
2025-11-14 16:57:57,445 - INFO - Processing document 4_2025-05-20
2025-11-14 16:57:57,494 - INFO - Finished converting document 4_2025-05-20 in 0.12 sec.
2025-11-14 16:57:57,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2025-04-02' --> 'data\processed_data\LIN\4_2025-04-02.md'
Converted 'data\edgar_documents\LIN\4_2025-05-20' --> 'data\processed_data\LIN\4_2025-05-20.md'


2025-11-14 16:57:57,620 - INFO - Going to convert document batch...
2025-11-14 16:57:57,621 - INFO - Processing document 4_2025-05-27
2025-11-14 16:57:57,694 - INFO - Finished converting document 4_2025-05-27 in 0.16 sec.
2025-11-14 16:57:57,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:57,824 - INFO - Going to convert document batch...
2025-11-14 16:57:57,826 - INFO - Processing document 4_2025-07-02
2025-11-14 16:57:57,853 - INFO - Finished converting document 4_2025-07-02 in 0.09 sec.
2025-11-14 16:57:57,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:57,935 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LIN\4_2025-05-27' --> 'data\processed_data\LIN\4_2025-05-27.md'
Converted 'data\edgar_documents\LIN\4_2025-07-02' --> 'data\processed_data\LIN\4_2025-07-02.md'


2025-11-14 16:57:57,936 - INFO - Processing document 4_2025-08-08
2025-11-14 16:57:58,005 - INFO - Finished converting document 4_2025-08-08 in 0.12 sec.
2025-11-14 16:57:58,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,144 - INFO - Going to convert document batch...
2025-11-14 16:57:58,145 - INFO - Processing document 4_2025-08-19
2025-11-14 16:57:58,216 - INFO - Finished converting document 4_2025-08-19 in 0.17 sec.


Converted 'data\edgar_documents\LIN\4_2025-08-08' --> 'data\processed_data\LIN\4_2025-08-08.md'


2025-11-14 16:57:58,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,292 - INFO - Going to convert document batch...
2025-11-14 16:57:58,294 - INFO - Processing document 4_2025-09-15
2025-11-14 16:57:58,435 - INFO - Finished converting document 4_2025-09-15 in 0.19 sec.


Converted 'data\edgar_documents\LIN\4_2025-08-19' --> 'data\processed_data\LIN\4_2025-08-19.md'


2025-11-14 16:57:58,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,547 - INFO - Going to convert document batch...
2025-11-14 16:57:58,548 - INFO - Processing document 4_2025-10-02
2025-11-14 16:57:58,670 - INFO - Finished converting document 4_2025-10-02 in 0.19 sec.


Converted 'data\edgar_documents\LIN\4_2025-09-15' --> 'data\processed_data\LIN\4_2025-09-15.md'


2025-11-14 16:57:58,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,775 - INFO - Going to convert document batch...
2025-11-14 16:57:58,776 - INFO - Processing document 8-K_2023-01-23
2025-11-14 16:57:58,807 - INFO - Finished converting document 8-K_2023-01-23 in 0.11 sec.
2025-11-14 16:57:58,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,850 - INFO - Going to convert document batch...
2025-11-14 16:57:58,850 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:57:58,866 - INFO - Finished converting document 8-K_2023-01-24 in 0.03 sec.
2025-11-14 16:57:58,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\4_2025-10-02' --> 'data\processed_data\LIN\4_2025-10-02.md'
Converted 'data\edgar_documents\LIN\8-K_2023-01-23' --> 'data\processed_data\LIN\8-K_2023-01-23.md'
Converted 'data\edgar_documents\LIN\8-K_2023-01-24' --> 'data\processed_data\LIN\8-K_2023-01-24.md'


2025-11-14 16:57:58,912 - INFO - Going to convert document batch...
2025-11-14 16:57:58,913 - INFO - Processing document 8-K_2023-02-07
2025-11-14 16:57:58,934 - INFO - Finished converting document 8-K_2023-02-07 in 0.06 sec.
2025-11-14 16:57:58,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:58,984 - INFO - Going to convert document batch...
2025-11-14 16:57:58,985 - INFO - Processing document 8-K_2023-03-01
2025-11-14 16:57:59,097 - INFO - Finished converting document 8-K_2023-03-01 in 0.14 sec.


Converted 'data\edgar_documents\LIN\8-K_2023-02-07' --> 'data\processed_data\LIN\8-K_2023-02-07.md'
Converted 'data\edgar_documents\LIN\8-K_2023-03-01' --> 'data\processed_data\LIN\8-K_2023-03-01.md'


2025-11-14 16:57:59,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,207 - INFO - Going to convert document batch...
2025-11-14 16:57:59,208 - INFO - Processing document 8-K_2023-04-27
2025-11-14 16:57:59,234 - INFO - Finished converting document 8-K_2023-04-27 in 0.11 sec.
2025-11-14 16:57:59,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,293 - INFO - Going to convert document batch...
2025-11-14 16:57:59,294 - INFO - Processing document 8-K_2023-04-28
2025-11-14 16:57:59,344 - INFO - Finished converting document 8-K_2023-04-28 in 0.09 sec.
2025-11-14 16:57:59,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,386 - INFO - Going to convert document batch...
2025-11-14 16:57:59,387 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:57:59,413 - INFO - Finished converting document 8-K_2023-06-12 in 0.05 sec.


Converted 'data\edgar_documents\LIN\8-K_2023-04-27' --> 'data\processed_data\LIN\8-K_2023-04-27.md'
Converted 'data\edgar_documents\LIN\8-K_2023-04-28' --> 'data\processed_data\LIN\8-K_2023-04-28.md'
Converted 'data\edgar_documents\LIN\8-K_2023-06-12' --> 'data\processed_data\LIN\8-K_2023-06-12.md'


2025-11-14 16:57:59,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,480 - INFO - Going to convert document batch...
2025-11-14 16:57:59,481 - INFO - Processing document 8-K_2023-07-27
2025-11-14 16:57:59,512 - INFO - Finished converting document 8-K_2023-07-27 in 0.09 sec.
2025-11-14 16:57:59,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,660 - INFO - Going to convert document batch...
2025-11-14 16:57:59,662 - INFO - Processing document 8-K_2023-07-28
2025-11-14 16:57:59,724 - INFO - Finished converting document 8-K_2023-07-28 in 0.19 sec.


Converted 'data\edgar_documents\LIN\8-K_2023-07-27' --> 'data\processed_data\LIN\8-K_2023-07-27.md'


2025-11-14 16:57:59,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,812 - INFO - Going to convert document batch...
2025-11-14 16:57:59,813 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:57:59,834 - INFO - Finished converting document 8-K_2023-10-26 in 0.08 sec.
2025-11-14 16:57:59,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:57:59,893 - INFO - Going to convert document batch...
2025-11-14 16:57:59,893 - INFO - Processing document 8-K_2023-12-06
2025-11-14 16:57:59,936 - INFO - Finished converting document 8-K_2023-12-06 in 0.08 sec.


Converted 'data\edgar_documents\LIN\8-K_2023-07-28' --> 'data\processed_data\LIN\8-K_2023-07-28.md'
Converted 'data\edgar_documents\LIN\8-K_2023-10-26' --> 'data\processed_data\LIN\8-K_2023-10-26.md'


2025-11-14 16:58:00,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,077 - INFO - Going to convert document batch...
2025-11-14 16:58:00,078 - INFO - Processing document 8-K_2024-02-06
2025-11-14 16:58:00,115 - INFO - Finished converting document 8-K_2024-02-06 in 0.16 sec.


Converted 'data\edgar_documents\LIN\8-K_2023-12-06' --> 'data\processed_data\LIN\8-K_2023-12-06.md'
Converted 'data\edgar_documents\LIN\8-K_2024-02-06' --> 'data\processed_data\LIN\8-K_2024-02-06.md'


2025-11-14 16:58:00,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,186 - INFO - Going to convert document batch...
2025-11-14 16:58:00,187 - INFO - Processing document 8-K_2024-02-14
2025-11-14 16:58:00,219 - INFO - Finished converting document 8-K_2024-02-14 in 0.09 sec.
2025-11-14 16:58:00,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,276 - INFO - Going to convert document batch...
2025-11-14 16:58:00,277 - INFO - Processing document 8-K_2024-02-28
2025-11-14 16:58:00,297 - INFO - Finished converting document 8-K_2024-02-28 in 0.06 sec.
2025-11-14 16:58:00,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,334 - INFO - Going to convert document batch...
2025-11-14 16:58:00,334 - INFO - Processing document 8-K_2024-04-30
2025-11-14 16:58:00,355 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.
2025-11-14 16:58:00,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\LIN\8-K_2024-02-14' --> 'data\processed_data\LIN\8-K_2024-02-14.md'
Converted 'data\edgar_documents\LIN\8-K_2024-02-28' --> 'data\processed_data\LIN\8-K_2024-02-28.md'
Converted 'data\edgar_documents\LIN\8-K_2024-04-30' --> 'data\processed_data\LIN\8-K_2024-04-30.md'


2025-11-14 16:58:00,439 - INFO - Finished converting document 8-K_2024-05-02 in 0.06 sec.
2025-11-14 16:58:00,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,560 - INFO - Going to convert document batch...
2025-11-14 16:58:00,561 - INFO - Processing document 8-K_2024-06-04
2025-11-14 16:58:00,599 - INFO - Finished converting document 8-K_2024-06-04 in 0.12 sec.


Converted 'data\edgar_documents\LIN\8-K_2024-05-02' --> 'data\processed_data\LIN\8-K_2024-05-02.md'
Converted 'data\edgar_documents\LIN\8-K_2024-06-04' --> 'data\processed_data\LIN\8-K_2024-06-04.md'


2025-11-14 16:58:00,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:00,715 - INFO - Going to convert document batch...
2025-11-14 16:58:00,716 - INFO - Processing document 8-K_2024-08-02
2025-11-14 16:58:01,126 - INFO - Finished converting document 8-K_2024-08-02 in 0.52 sec.
2025-11-14 16:58:01,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,193 - INFO - Going to convert document batch...
2025-11-14 16:58:01,195 - INFO - Processing document 8-K_2024-10-31
2025-11-14 16:58:01,215 - INFO - Finished converting document 8-K_2024-10-31 in 0.06 sec.
2025-11-14 16:58:01,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,261 - INFO - Going to convert document batch...
2025-11-14 16:58:01,262 - INFO - Processing document 8-K_2024-11-04
2025-11-14 16:58:01,282 - INFO - Finished converting document 8-K_2024-11-04 in 0.05 sec.
2025-11-14 16:58:01,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\LIN\8-K_2024-08-02' --> 'data\processed_data\LIN\8-K_2024-08-02.md'
Converted 'data\edgar_documents\LIN\8-K_2024-10-31' --> 'data\processed_data\LIN\8-K_2024-10-31.md'
Converted 'data\edgar_documents\LIN\8-K_2024-11-04' --> 'data\processed_data\LIN\8-K_2024-11-04.md'


2025-11-14 16:58:01,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,392 - INFO - Going to convert document batch...
2025-11-14 16:58:01,393 - INFO - Processing document 8-K_2024-12-04
2025-11-14 16:58:01,421 - INFO - Finished converting document 8-K_2024-12-04 in 0.06 sec.
2025-11-14 16:58:01,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,476 - INFO - Going to convert document batch...
2025-11-14 16:58:01,477 - INFO - Processing document 8-K_2025-02-06
2025-11-14 16:58:01,498 - INFO - Finished converting document 8-K_2025-02-06 in 0.06 sec.
2025-11-14 16:58:01,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,537 - INFO - Going to convert document batch...
2025-11-14 16:58:01,538 - INFO - Processing document 8-K_2025-02-18
2025-11-14 16:58:01,564 - INFO - Finished converting document 8-K_2025-02-18 in 0.05 sec.


Converted 'data\edgar_documents\LIN\8-K_2024-12-02' --> 'data\processed_data\LIN\8-K_2024-12-02.md'
Converted 'data\edgar_documents\LIN\8-K_2024-12-04' --> 'data\processed_data\LIN\8-K_2024-12-04.md'
Converted 'data\edgar_documents\LIN\8-K_2025-02-06' --> 'data\processed_data\LIN\8-K_2025-02-06.md'


2025-11-14 16:58:01,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,612 - INFO - Going to convert document batch...
2025-11-14 16:58:01,667 - INFO - Processing document 8-K_2025-05-01
2025-11-14 16:58:01,720 - INFO - Finished converting document 8-K_2025-05-01 in 0.14 sec.


Converted 'data\edgar_documents\LIN\8-K_2025-02-18' --> 'data\processed_data\LIN\8-K_2025-02-18.md'
Converted 'data\edgar_documents\LIN\8-K_2025-05-01' --> 'data\processed_data\LIN\8-K_2025-05-01.md'


2025-11-14 16:58:01,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,799 - INFO - Going to convert document batch...
2025-11-14 16:58:01,799 - INFO - Processing document 8-K_2025-06-05
2025-11-14 16:58:01,845 - INFO - Finished converting document 8-K_2025-06-05 in 0.11 sec.
2025-11-14 16:58:01,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:01,912 - INFO - Going to convert document batch...
2025-11-14 16:58:01,913 - INFO - Processing document 8-K_2025-08-01
2025-11-14 16:58:01,975 - INFO - Finished converting document 8-K_2025-08-01 in 0.11 sec.


Converted 'data\edgar_documents\LIN\8-K_2025-06-05' --> 'data\processed_data\LIN\8-K_2025-06-05.md'
Converted 'data\edgar_documents\LIN\8-K_2025-08-01' --> 'data\processed_data\LIN\8-K_2025-08-01.md'


2025-11-14 16:58:02,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:02,076 - INFO - Going to convert document batch...
2025-11-14 16:58:02,076 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:58:02,101 - INFO - Finished converting document 8-K_2025-08-07 in 0.06 sec.
2025-11-14 16:58:02,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:02,201 - INFO - Going to convert document batch...
2025-11-14 16:58:02,203 - INFO - Processing document 8-K_2025-09-29
2025-11-14 16:58:02,240 - INFO - Finished converting document 8-K_2025-09-29 in 0.11 sec.
2025-11-14 16:58:02,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:02,295 - INFO - Going to convert document batch...
2025-11-14 16:58:02,296 - INFO - Processing document 8-K_2025-10-31
2025-11-14 16:58:02,317 - INFO - Finished converting document 8-K_2025-10-31 in 0.05 sec.


Converted 'data\edgar_documents\LIN\8-K_2025-08-07' --> 'data\processed_data\LIN\8-K_2025-08-07.md'
Converted 'data\edgar_documents\LIN\8-K_2025-09-29' --> 'data\processed_data\LIN\8-K_2025-09-29.md'


2025-11-14 16:58:02,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\8-K_2025-10-31' --> 'data\processed_data\LIN\8-K_2025-10-31.md'


2025-11-14 16:58:03,528 - INFO - Going to convert document batch...
2025-11-14 16:58:03,528 - INFO - Processing document DEF-14A_2023-05-01
2025-11-14 16:58:04,973 - INFO - Finished converting document DEF-14A_2023-05-01 in 2.64 sec.
2025-11-14 16:58:05,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\DEF-14A_2023-05-01' --> 'data\processed_data\LIN\DEF-14A_2023-05-01.md'


2025-11-14 16:58:06,723 - INFO - Going to convert document batch...
2025-11-14 16:58:06,724 - INFO - Processing document DEF-14A_2024-04-29
2025-11-14 16:58:07,994 - INFO - Finished converting document DEF-14A_2024-04-29 in 2.30 sec.
2025-11-14 16:58:08,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\DEF-14A_2024-04-29' --> 'data\processed_data\LIN\DEF-14A_2024-04-29.md'


2025-11-14 16:58:11,109 - INFO - Going to convert document batch...
2025-11-14 16:58:11,109 - INFO - Processing document DEF-14A_2025-04-30
2025-11-14 16:58:13,784 - INFO - Finished converting document DEF-14A_2025-04-30 in 5.00 sec.
2025-11-14 16:58:14,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LIN\DEF-14A_2025-04-30' --> 'data\processed_data\LIN\DEF-14A_2025-04-30.md'
Processed 94 new files. Errors: 0
Found 216 files to process in data\edgar_documents\LLY


2025-11-14 16:58:15,773 - INFO - Going to convert document batch...
2025-11-14 16:58:15,774 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:58:15,775 - INFO - Processing document 10-K_2023-02-22
2025-11-14 16:58:17,906 - INFO - Finished converting document 10-K_2023-02-22 in 3.55 sec.
2025-11-14 16:58:18,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-K_2023-02-22' --> 'data\processed_data\LLY\10-K_2023-02-22.md'


2025-11-14 16:58:19,524 - INFO - Going to convert document batch...
2025-11-14 16:58:19,526 - INFO - Processing document 10-K_2024-02-21
2025-11-14 16:58:21,897 - INFO - Finished converting document 10-K_2024-02-21 in 3.33 sec.
2025-11-14 16:58:22,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-K_2024-02-21' --> 'data\processed_data\LLY\10-K_2024-02-21.md'


2025-11-14 16:58:23,553 - INFO - Going to convert document batch...
2025-11-14 16:58:23,555 - INFO - Processing document 10-K_2025-02-19
2025-11-14 16:58:26,005 - INFO - Finished converting document 10-K_2025-02-19 in 3.36 sec.
2025-11-14 16:58:26,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-K_2025-02-19' --> 'data\processed_data\LLY\10-K_2025-02-19.md'


2025-11-14 16:58:27,237 - INFO - Going to convert document batch...
2025-11-14 16:58:27,238 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 16:58:28,021 - INFO - Finished converting document 10-Q_2023-04-27 in 1.27 sec.
2025-11-14 16:58:28,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2023-04-27' --> 'data\processed_data\LLY\10-Q_2023-04-27.md'


2025-11-14 16:58:29,687 - INFO - Going to convert document batch...
2025-11-14 16:58:29,687 - INFO - Processing document 10-Q_2023-08-08
2025-11-14 16:58:30,873 - INFO - Finished converting document 10-Q_2023-08-08 in 2.45 sec.
2025-11-14 16:58:31,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2023-08-08' --> 'data\processed_data\LLY\10-Q_2023-08-08.md'


2025-11-14 16:58:32,293 - INFO - Going to convert document batch...
2025-11-14 16:58:32,295 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:58:33,801 - INFO - Finished converting document 10-Q_2023-11-02 in 2.28 sec.
2025-11-14 16:58:34,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2023-11-02' --> 'data\processed_data\LLY\10-Q_2023-11-02.md'


2025-11-14 16:58:34,953 - INFO - Going to convert document batch...
2025-11-14 16:58:34,953 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 16:58:35,739 - INFO - Finished converting document 10-Q_2024-04-30 in 1.44 sec.
2025-11-14 16:58:36,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2024-04-30' --> 'data\processed_data\LLY\10-Q_2024-04-30.md'


2025-11-14 16:58:36,849 - INFO - Going to convert document batch...
2025-11-14 16:58:36,850 - INFO - Processing document 10-Q_2024-08-08
2025-11-14 16:58:38,465 - INFO - Finished converting document 10-Q_2024-08-08 in 2.33 sec.
2025-11-14 16:58:39,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2024-08-08' --> 'data\processed_data\LLY\10-Q_2024-08-08.md'


2025-11-14 16:58:39,605 - INFO - Going to convert document batch...
2025-11-14 16:58:39,605 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 16:58:40,849 - INFO - Finished converting document 10-Q_2024-10-30 in 1.92 sec.
2025-11-14 16:58:41,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2024-10-30' --> 'data\processed_data\LLY\10-Q_2024-10-30.md'


2025-11-14 16:58:42,382 - INFO - Going to convert document batch...
2025-11-14 16:58:42,383 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:58:43,022 - INFO - Finished converting document 10-Q_2025-05-01 in 1.52 sec.
2025-11-14 16:58:43,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2025-05-01' --> 'data\processed_data\LLY\10-Q_2025-05-01.md'


2025-11-14 16:58:44,022 - INFO - Going to convert document batch...
2025-11-14 16:58:44,022 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:58:45,670 - INFO - Finished converting document 10-Q_2025-08-07 in 2.33 sec.
2025-11-14 16:58:46,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\10-Q_2025-08-07' --> 'data\processed_data\LLY\10-Q_2025-08-07.md'


2025-11-14 16:58:46,695 - INFO - Going to convert document batch...
2025-11-14 16:58:46,696 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 16:58:47,549 - INFO - Finished converting document 10-Q_2025-10-30 in 1.45 sec.
2025-11-14 16:58:47,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,010 - INFO - Going to convert document batch...
2025-11-14 16:58:48,010 - INFO - Processing document 4_2023-01-19
2025-11-14 16:58:48,031 - INFO - Finished converting document 4_2023-01-19 in 0.08 sec.
2025-11-14 16:58:48,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,082 - INFO - Going to convert document batch...
2025-11-14 16:58:48,082 - INFO - Processing document 4_2023-02-03
2025-11-14 16:58:48,104 - INFO - Finished converting document 4_2023-02-03 in 0.05 sec.


Converted 'data\edgar_documents\LLY\10-Q_2025-10-30' --> 'data\processed_data\LLY\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\LLY\4_2023-01-19' --> 'data\processed_data\LLY\4_2023-01-19.md'
Converted 'data\edgar_documents\LLY\4_2023-02-03' --> 'data\processed_data\LLY\4_2023-02-03.md'


2025-11-14 16:58:48,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,151 - INFO - Going to convert document batch...
2025-11-14 16:58:48,152 - INFO - Processing document 4_2023-02-14
2025-11-14 16:58:48,177 - INFO - Finished converting document 4_2023-02-14 in 0.05 sec.
2025-11-14 16:58:48,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,245 - INFO - Going to convert document batch...
2025-11-14 16:58:48,245 - INFO - Processing document 4_2023-02-21
2025-11-14 16:58:48,271 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 16:58:48,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,325 - INFO - Going to convert document batch...
2025-11-14 16:58:48,326 - INFO - Processing document 4_2023-02-22
2025-11-14 16:58:48,348 - INFO - Finished converting document 4_2023-02-22 in 0.05 sec.
2025-11-14 16:58:48,391 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025

Converted 'data\edgar_documents\LLY\4_2023-02-14' --> 'data\processed_data\LLY\4_2023-02-14.md'
Converted 'data\edgar_documents\LLY\4_2023-02-21' --> 'data\processed_data\LLY\4_2023-02-21.md'
Converted 'data\edgar_documents\LLY\4_2023-02-22' --> 'data\processed_data\LLY\4_2023-02-22.md'
Error processing data\edgar_documents\LLY\4_2023-02-23: File format not allowed: data\edgar_documents\LLY\4_2023-02-23


2025-11-14 16:58:48,413 - ERROR - Input document 4_2023-02-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:58:48,416 - INFO - Going to convert document batch...
2025-11-14 16:58:48,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,443 - INFO - Going to convert document batch...
2025-11-14 16:58:48,445 - INFO - Processing document 4_2023-03-01
2025-11-14 16:58:48,481 - INFO - Finished converting document 4_2023-03-01 in 0.06 sec.
2025-11-14 16:58:48,547 - INFO - detec

Error processing data\edgar_documents\LLY\4_2023-02-24: File format not allowed: data\edgar_documents\LLY\4_2023-02-24
Converted 'data\edgar_documents\LLY\4_2023-03-01' --> 'data\processed_data\LLY\4_2023-03-01.md'


2025-11-14 16:58:48,603 - INFO - Processing document 4_2023-03-02
2025-11-14 16:58:48,635 - INFO - Finished converting document 4_2023-03-02 in 0.12 sec.
2025-11-14 16:58:48,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,720 - INFO - Going to convert document batch...
2025-11-14 16:58:48,721 - INFO - Processing document 4_2023-03-13
2025-11-14 16:58:48,753 - INFO - Finished converting document 4_2023-03-13 in 0.09 sec.
2025-11-14 16:58:48,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,799 - INFO - Going to convert document batch...
2025-11-14 16:58:48,800 - INFO - Processing document 4_2023-03-22
2025-11-14 16:58:48,821 - INFO - Finished converting document 4_2023-03-22 in 0.03 sec.


Converted 'data\edgar_documents\LLY\4_2023-03-02' --> 'data\processed_data\LLY\4_2023-03-02.md'
Converted 'data\edgar_documents\LLY\4_2023-03-13' --> 'data\processed_data\LLY\4_2023-03-13.md'


2025-11-14 16:58:48,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,875 - INFO - Going to convert document batch...
2025-11-14 16:58:48,876 - INFO - Processing document 4_2023-03-27
2025-11-14 16:58:48,900 - INFO - Finished converting document 4_2023-03-27 in 0.05 sec.
2025-11-14 16:58:48,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:48,996 - INFO - Going to convert document batch...
2025-11-14 16:58:49,035 - INFO - Processing document 4_2023-04-03


Converted 'data\edgar_documents\LLY\4_2023-03-22' --> 'data\processed_data\LLY\4_2023-03-22.md'
Converted 'data\edgar_documents\LLY\4_2023-03-27' --> 'data\processed_data\LLY\4_2023-03-27.md'


2025-11-14 16:58:49,099 - INFO - Finished converting document 4_2023-04-03 in 0.14 sec.
2025-11-14 16:58:49,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,195 - INFO - Going to convert document batch...
2025-11-14 16:58:49,195 - INFO - Processing document 4_2023-04-04
2025-11-14 16:58:49,220 - INFO - Finished converting document 4_2023-04-04 in 0.08 sec.
2025-11-14 16:58:49,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,288 - INFO - Going to convert document batch...
2025-11-14 16:58:49,290 - INFO - Processing document 4_2023-04-06
2025-11-14 16:58:49,325 - INFO - Finished converting document 4_2023-04-06 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-04-03' --> 'data\processed_data\LLY\4_2023-04-03.md'
Converted 'data\edgar_documents\LLY\4_2023-04-04' --> 'data\processed_data\LLY\4_2023-04-04.md'


2025-11-14 16:58:49,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,394 - INFO - Going to convert document batch...
2025-11-14 16:58:49,395 - INFO - Processing document 4_2023-04-07
2025-11-14 16:58:49,425 - INFO - Finished converting document 4_2023-04-07 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-04-06' --> 'data\processed_data\LLY\4_2023-04-06.md'
Converted 'data\edgar_documents\LLY\4_2023-04-07' --> 'data\processed_data\LLY\4_2023-04-07.md'


2025-11-14 16:58:49,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,600 - INFO - Going to convert document batch...
2025-11-14 16:58:49,601 - INFO - Processing document 4_2023-04-19
2025-11-14 16:58:49,628 - INFO - Finished converting document 4_2023-04-19 in 0.09 sec.
2025-11-14 16:58:49,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,697 - INFO - Going to convert document batch...
2025-11-14 16:58:49,698 - INFO - Processing document 4_2023-05-01
2025-11-14 16:58:49,731 - INFO - Finished converting document 4_2023-05-01 in 0.08 sec.
2025-11-14 16:58:49,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,798 - INFO - Going to convert document batch...
2025-11-14 16:58:49,798 - INFO - Processing document 4_2023-05-03
2025-11-14 16:58:49,823 - INFO - Finished converting document 4_2023-05-03 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-04-19' --> 'data\processed_data\LLY\4_2023-04-19.md'
Converted 'data\edgar_documents\LLY\4_2023-05-01' --> 'data\processed_data\LLY\4_2023-05-01.md'


2025-11-14 16:58:49,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:49,893 - INFO - Going to convert document batch...
2025-11-14 16:58:49,894 - INFO - Processing document 4_2023-05-04
2025-11-14 16:58:49,945 - INFO - Finished converting document 4_2023-05-04 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-05-03' --> 'data\processed_data\LLY\4_2023-05-03.md'
Converted 'data\edgar_documents\LLY\4_2023-05-04' --> 'data\processed_data\LLY\4_2023-05-04.md'


2025-11-14 16:58:50,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:50,119 - INFO - Going to convert document batch...
2025-11-14 16:58:50,119 - INFO - Processing document 4_2023-05-15
2025-11-14 16:58:50,146 - INFO - Finished converting document 4_2023-05-15 in 0.08 sec.
2025-11-14 16:58:50,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:50,208 - INFO - Going to convert document batch...
2025-11-14 16:58:50,210 - INFO - Processing document 4_2023-05-16
2025-11-14 16:58:50,232 - INFO - Finished converting document 4_2023-05-16 in 0.05 sec.
2025-11-14 16:58:50,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:50,283 - INFO - Going to convert document batch...
2025-11-14 16:58:50,284 - INFO - Processing document 4_2023-05-22
2025-11-14 16:58:50,318 - INFO - Finished converting document 4_2023-05-22 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-05-15' --> 'data\processed_data\LLY\4_2023-05-15.md'
Converted 'data\edgar_documents\LLY\4_2023-05-16' --> 'data\processed_data\LLY\4_2023-05-16.md'


2025-11-14 16:58:50,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2023-05-22' --> 'data\processed_data\LLY\4_2023-05-22.md'


2025-11-14 16:58:50,849 - INFO - Going to convert document batch...
2025-11-14 16:58:50,850 - INFO - Processing document 4_2023-06-02
2025-11-14 16:58:50,895 - INFO - Finished converting document 4_2023-06-02 in 0.53 sec.
2025-11-14 16:58:51,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,074 - INFO - Going to convert document batch...
2025-11-14 16:58:51,076 - INFO - Processing document 4_2023-06-15
2025-11-14 16:58:51,102 - INFO - Finished converting document 4_2023-06-15 in 0.08 sec.
2025-11-14 16:58:51,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,167 - INFO - Going to convert document batch...
2025-11-14 16:58:51,168 - INFO - Processing document 4_2023-06-16
2025-11-14 16:58:51,205 - INFO - Finished converting document 4_2023-06-16 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-06-02' --> 'data\processed_data\LLY\4_2023-06-02.md'
Converted 'data\edgar_documents\LLY\4_2023-06-15' --> 'data\processed_data\LLY\4_2023-06-15.md'


2025-11-14 16:58:51,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,274 - INFO - Going to convert document batch...
2025-11-14 16:58:51,275 - INFO - Processing document 4_2023-06-20
2025-11-14 16:58:51,299 - INFO - Finished converting document 4_2023-06-20 in 0.05 sec.
2025-11-14 16:58:51,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,359 - INFO - Going to convert document batch...
2025-11-14 16:58:51,360 - INFO - Processing document 4_2023-06-21
2025-11-14 16:58:51,384 - INFO - Finished converting document 4_2023-06-21 in 0.05 sec.
2025-11-14 16:58:51,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,440 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2023-06-16' --> 'data\processed_data\LLY\4_2023-06-16.md'
Converted 'data\edgar_documents\LLY\4_2023-06-20' --> 'data\processed_data\LLY\4_2023-06-20.md'
Converted 'data\edgar_documents\LLY\4_2023-06-21' --> 'data\processed_data\LLY\4_2023-06-21.md'


2025-11-14 16:58:51,441 - INFO - Processing document 4_2023-06-22
2025-11-14 16:58:51,463 - INFO - Finished converting document 4_2023-06-22 in 0.06 sec.
2025-11-14 16:58:51,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,764 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2023-06-22' --> 'data\processed_data\LLY\4_2023-06-22.md'


2025-11-14 16:58:51,765 - INFO - Processing document 4_2023-06-23
2025-11-14 16:58:51,797 - INFO - Finished converting document 4_2023-06-23 in 0.22 sec.
2025-11-14 16:58:51,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:51,937 - INFO - Going to convert document batch...
2025-11-14 16:58:51,939 - INFO - Processing document 4_2023-06-30
2025-11-14 16:58:51,976 - INFO - Finished converting document 4_2023-06-30 in 0.12 sec.


Converted 'data\edgar_documents\LLY\4_2023-06-23' --> 'data\processed_data\LLY\4_2023-06-23.md'
Converted 'data\edgar_documents\LLY\4_2023-06-30' --> 'data\processed_data\LLY\4_2023-06-30.md'


2025-11-14 16:58:52,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,087 - INFO - Going to convert document batch...
2025-11-14 16:58:52,089 - INFO - Processing document 4_2023-07-03
2025-11-14 16:58:52,126 - INFO - Finished converting document 4_2023-07-03 in 0.11 sec.
2025-11-14 16:58:52,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,221 - INFO - Going to convert document batch...
2025-11-14 16:58:52,222 - INFO - Processing document 4_2023-07-18
2025-11-14 16:58:52,245 - INFO - Finished converting document 4_2023-07-18 in 0.08 sec.
2025-11-14 16:58:52,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,289 - INFO - Going to convert document batch...
2025-11-14 16:58:52,291 - INFO - Processing document 4_2023-07-24
2025-11-14 16:58:52,317 - INFO - Finished converting document 4_2023-07-24 in 0.05 sec.
2025-11-14 16:58:52,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2023-07-03' --> 'data\processed_data\LLY\4_2023-07-03.md'
Converted 'data\edgar_documents\LLY\4_2023-07-18' --> 'data\processed_data\LLY\4_2023-07-18.md'
Converted 'data\edgar_documents\LLY\4_2023-07-24' --> 'data\processed_data\LLY\4_2023-07-24.md'


2025-11-14 16:58:52,403 - INFO - Going to convert document batch...
2025-11-14 16:58:52,406 - INFO - Processing document 4_2023-08-09
2025-11-14 16:58:52,582 - INFO - Finished converting document 4_2023-08-09 in 0.23 sec.
2025-11-14 16:58:52,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,724 - INFO - Going to convert document batch...
2025-11-14 16:58:52,725 - INFO - Processing document 4_2023-08-10
2025-11-14 16:58:52,746 - INFO - Finished converting document 4_2023-08-10 in 0.11 sec.
2025-11-14 16:58:52,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,796 - INFO - Going to convert document batch...
2025-11-14 16:58:52,796 - INFO - Processing document 4_2023-08-11
2025-11-14 16:58:52,825 - INFO - Finished converting document 4_2023-08-11 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-08-09' --> 'data\processed_data\LLY\4_2023-08-09.md'
Converted 'data\edgar_documents\LLY\4_2023-08-10' --> 'data\processed_data\LLY\4_2023-08-10.md'


2025-11-14 16:58:52,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,881 - INFO - Going to convert document batch...
2025-11-14 16:58:52,882 - INFO - Processing document 4_2023-08-14
2025-11-14 16:58:52,930 - INFO - Finished converting document 4_2023-08-14 in 0.08 sec.
2025-11-14 16:58:52,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:52,994 - INFO - Going to convert document batch...
2025-11-14 16:58:52,995 - INFO - Processing document 4_2023-08-15
2025-11-14 16:58:53,020 - INFO - Finished converting document 4_2023-08-15 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-08-11' --> 'data\processed_data\LLY\4_2023-08-11.md'
Converted 'data\edgar_documents\LLY\4_2023-08-14' --> 'data\processed_data\LLY\4_2023-08-14.md'


2025-11-14 16:58:53,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,083 - INFO - Going to convert document batch...
2025-11-14 16:58:53,084 - INFO - Processing document 4_2023-08-16
2025-11-14 16:58:53,123 - INFO - Finished converting document 4_2023-08-16 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-08-15' --> 'data\processed_data\LLY\4_2023-08-15.md'


2025-11-14 16:58:53,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,283 - INFO - Going to convert document batch...
2025-11-14 16:58:53,284 - INFO - Processing document 4_2023-08-22
2025-11-14 16:58:53,313 - INFO - Finished converting document 4_2023-08-22 in 0.06 sec.
2025-11-14 16:58:53,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,366 - INFO - Going to convert document batch...
2025-11-14 16:58:53,367 - INFO - Processing document 4_2023-08-24
2025-11-14 16:58:53,389 - INFO - Finished converting document 4_2023-08-24 in 0.05 sec.
2025-11-14 16:58:53,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2023-08-16' --> 'data\processed_data\LLY\4_2023-08-16.md'
Converted 'data\edgar_documents\LLY\4_2023-08-22' --> 'data\processed_data\LLY\4_2023-08-22.md'
Converted 'data\edgar_documents\LLY\4_2023-08-24' --> 'data\processed_data\LLY\4_2023-08-24.md'


2025-11-14 16:58:53,453 - INFO - Going to convert document batch...
2025-11-14 16:58:53,454 - INFO - Processing document 4_2023-08-25
2025-11-14 16:58:53,482 - INFO - Finished converting document 4_2023-08-25 in 0.08 sec.
2025-11-14 16:58:53,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,540 - INFO - Going to convert document batch...
2025-11-14 16:58:53,541 - INFO - Processing document 4_2023-08-28
2025-11-14 16:58:53,571 - INFO - Finished converting document 4_2023-08-28 in 0.05 sec.
2025-11-14 16:58:53,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,624 - INFO - Going to convert document batch...
2025-11-14 16:58:53,625 - INFO - Processing document 4_2023-08-29
2025-11-14 16:58:53,655 - INFO - Finished converting document 4_2023-08-29 in 0.06 sec.
2025-11-14 16:58:53,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2023-08-25' --> 'data\processed_data\LLY\4_2023-08-25.md'
Converted 'data\edgar_documents\LLY\4_2023-08-28' --> 'data\processed_data\LLY\4_2023-08-28.md'
Converted 'data\edgar_documents\LLY\4_2023-08-29' --> 'data\processed_data\LLY\4_2023-08-29.md'


2025-11-14 16:58:53,722 - INFO - Going to convert document batch...
2025-11-14 16:58:53,723 - INFO - Processing document 4_2023-08-30
2025-11-14 16:58:53,753 - INFO - Finished converting document 4_2023-08-30 in 0.06 sec.
2025-11-14 16:58:53,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:53,936 - INFO - Going to convert document batch...
2025-11-14 16:58:53,938 - INFO - Processing document 4_2023-08-31
2025-11-14 16:58:53,978 - INFO - Finished converting document 4_2023-08-31 in 0.11 sec.


Converted 'data\edgar_documents\LLY\4_2023-08-30' --> 'data\processed_data\LLY\4_2023-08-30.md'
Converted 'data\edgar_documents\LLY\4_2023-08-31' --> 'data\processed_data\LLY\4_2023-08-31.md'


2025-11-14 16:58:54,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,091 - INFO - Going to convert document batch...
2025-11-14 16:58:54,092 - INFO - Processing document 4_2023-09-01
2025-11-14 16:58:54,122 - INFO - Finished converting document 4_2023-09-01 in 0.11 sec.
2025-11-14 16:58:54,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,188 - INFO - Going to convert document batch...
2025-11-14 16:58:54,190 - INFO - Processing document 4_2023-09-08
2025-11-14 16:58:54,230 - INFO - Finished converting document 4_2023-09-08 in 0.09 sec.
2025-11-14 16:58:54,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,324 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2023-09-01' --> 'data\processed_data\LLY\4_2023-09-01.md'
Converted 'data\edgar_documents\LLY\4_2023-09-08' --> 'data\processed_data\LLY\4_2023-09-08.md'


2025-11-14 16:58:54,325 - INFO - Processing document 4_2023-09-13
2025-11-14 16:58:54,364 - INFO - Finished converting document 4_2023-09-13 in 0.09 sec.
2025-11-14 16:58:54,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,430 - INFO - Going to convert document batch...
2025-11-14 16:58:54,431 - INFO - Processing document 4_2023-09-20
2025-11-14 16:58:54,456 - INFO - Finished converting document 4_2023-09-20 in 0.06 sec.
2025-11-14 16:58:54,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,515 - INFO - Going to convert document batch...
2025-11-14 16:58:54,516 - INFO - Processing document 4_2023-10-12
2025-11-14 16:58:54,557 - INFO - Finished converting document 4_2023-10-12 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-09-13' --> 'data\processed_data\LLY\4_2023-09-13.md'
Converted 'data\edgar_documents\LLY\4_2023-09-20' --> 'data\processed_data\LLY\4_2023-09-20.md'
Converted 'data\edgar_documents\LLY\4_2023-10-12' --> 'data\processed_data\LLY\4_2023-10-12.md'


2025-11-14 16:58:54,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,626 - INFO - Going to convert document batch...
2025-11-14 16:58:54,627 - INFO - Processing document 4_2023-10-17
2025-11-14 16:58:54,668 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.
2025-11-14 16:58:54,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,742 - INFO - Going to convert document batch...
2025-11-14 16:58:54,743 - INFO - Processing document 4_2023-11-06
2025-11-14 16:58:54,778 - INFO - Finished converting document 4_2023-11-06 in 0.08 sec.
2025-11-14 16:58:54,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,852 - INFO - Going to convert document batch...
2025-11-14 16:58:54,853 - INFO - Processing document 4_2023-11-13
2025-11-14 16:58:54,876 - INFO - Finished converting document 4_2023-11-13 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2023-10-17' --> 'data\processed_data\LLY\4_2023-10-17.md'
Converted 'data\edgar_documents\LLY\4_2023-11-06' --> 'data\processed_data\LLY\4_2023-11-06.md'


2025-11-14 16:58:54,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:54,931 - INFO - Going to convert document batch...
2025-11-14 16:58:54,932 - INFO - Processing document 4_2023-11-15
2025-11-14 16:58:54,971 - INFO - Finished converting document 4_2023-11-15 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2023-11-13' --> 'data\processed_data\LLY\4_2023-11-13.md'
Converted 'data\edgar_documents\LLY\4_2023-11-15' --> 'data\processed_data\LLY\4_2023-11-15.md'


2025-11-14 16:58:55,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,148 - INFO - Going to convert document batch...
2025-11-14 16:58:55,149 - INFO - Processing document 4_2023-11-21
2025-11-14 16:58:55,187 - INFO - Finished converting document 4_2023-11-21 in 0.16 sec.
2025-11-14 16:58:55,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,391 - INFO - Going to convert document batch...
2025-11-14 16:58:55,392 - INFO - Processing document 4_2023-12-04


Converted 'data\edgar_documents\LLY\4_2023-11-21' --> 'data\processed_data\LLY\4_2023-11-21.md'


2025-11-14 16:58:55,441 - INFO - Finished converting document 4_2023-12-04 in 0.20 sec.
2025-11-14 16:58:55,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,548 - INFO - Going to convert document batch...
2025-11-14 16:58:55,549 - INFO - Processing document 4_2023-12-19
2025-11-14 16:58:55,576 - INFO - Finished converting document 4_2023-12-19 in 0.09 sec.
2025-11-14 16:58:55,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,665 - INFO - Going to convert document batch...
2025-11-14 16:58:55,666 - INFO - Processing document 4_2024-01-05


Converted 'data\edgar_documents\LLY\4_2023-12-04' --> 'data\processed_data\LLY\4_2023-12-04.md'
Converted 'data\edgar_documents\LLY\4_2023-12-19' --> 'data\processed_data\LLY\4_2023-12-19.md'


2025-11-14 16:58:55,700 - INFO - Finished converting document 4_2024-01-05 in 0.09 sec.
2025-11-14 16:58:55,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,791 - INFO - Going to convert document batch...
2025-11-14 16:58:55,792 - INFO - Processing document 4_2024-01-10
2025-11-14 16:58:55,826 - INFO - Finished converting document 4_2024-01-10 in 0.08 sec.
2025-11-14 16:58:55,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,880 - INFO - Going to convert document batch...
2025-11-14 16:58:55,881 - INFO - Processing document 4_2024-01-11
2025-11-14 16:58:55,913 - INFO - Finished converting document 4_2024-01-11 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2024-01-05' --> 'data\processed_data\LLY\4_2024-01-05.md'
Converted 'data\edgar_documents\LLY\4_2024-01-10' --> 'data\processed_data\LLY\4_2024-01-10.md'


2025-11-14 16:58:55,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:55,974 - INFO - Going to convert document batch...
2025-11-14 16:58:55,975 - INFO - Processing document 4_2024-01-12
2025-11-14 16:58:56,012 - INFO - Finished converting document 4_2024-01-12 in 0.08 sec.
2025-11-14 16:58:56,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,068 - INFO - Going to convert document batch...
2025-11-14 16:58:56,068 - INFO - Processing document 4_2024-01-17
2025-11-14 16:58:56,093 - INFO - Finished converting document 4_2024-01-17 in 0.05 sec.
2025-11-14 16:58:56,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2024-01-11' --> 'data\processed_data\LLY\4_2024-01-11.md'
Converted 'data\edgar_documents\LLY\4_2024-01-12' --> 'data\processed_data\LLY\4_2024-01-12.md'
Converted 'data\edgar_documents\LLY\4_2024-01-17' --> 'data\processed_data\LLY\4_2024-01-17.md'


2025-11-14 16:58:56,140 - INFO - Going to convert document batch...
2025-11-14 16:58:56,141 - INFO - Processing document 4_2024-01-30
2025-11-14 16:58:56,182 - INFO - Finished converting document 4_2024-01-30 in 0.08 sec.
2025-11-14 16:58:56,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,332 - INFO - Going to convert document batch...
2025-11-14 16:58:56,333 - INFO - Processing document 4_2024-01-31
2025-11-14 16:58:56,358 - INFO - Finished converting document 4_2024-01-31 in 0.06 sec.
2025-11-14 16:58:56,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,416 - INFO - Going to convert document batch...
2025-11-14 16:58:56,417 - INFO - Processing document 4_2024-02-01
2025-11-14 16:58:56,471 - INFO - Finished converting document 4_2024-02-01 in 0.09 sec.


Converted 'data\edgar_documents\LLY\4_2024-01-30' --> 'data\processed_data\LLY\4_2024-01-30.md'
Converted 'data\edgar_documents\LLY\4_2024-01-31' --> 'data\processed_data\LLY\4_2024-01-31.md'


2025-11-14 16:58:56,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,573 - INFO - Going to convert document batch...
2025-11-14 16:58:56,573 - INFO - Processing document 4_2024-02-02
2025-11-14 16:58:56,611 - INFO - Finished converting document 4_2024-02-02 in 0.11 sec.
2025-11-14 16:58:56,681 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:58:56,681 - ERROR - Input document 4_2024-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))


Converted 'data\edgar_documents\LLY\4_2024-02-01' --> 'data\processed_data\LLY\4_2024-02-01.md'
Converted 'data\edgar_documents\LLY\4_2024-02-02' --> 'data\processed_data\LLY\4_2024-02-02.md'


2025-11-14 16:58:56,683 - INFO - Going to convert document batch...
2025-11-14 16:58:56,711 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:58:56,711 - ERROR - Input document 4_2024-02-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:58:56,713 - INFO - Going to convert document batch...
2025-11-14 16:58:56,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,742 - INFO - Going to convert document batch...
2025-11-14 16:58:56,743 - INFO - P

Error processing data\edgar_documents\LLY\4_2024-02-07: File format not allowed: data\edgar_documents\LLY\4_2024-02-07
Error processing data\edgar_documents\LLY\4_2024-02-08: File format not allowed: data\edgar_documents\LLY\4_2024-02-08
Converted 'data\edgar_documents\LLY\4_2024-02-09' --> 'data\processed_data\LLY\4_2024-02-09.md'


2025-11-14 16:58:56,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:56,924 - INFO - Going to convert document batch...
2025-11-14 16:58:56,925 - INFO - Processing document 4_2024-02-14
2025-11-14 16:58:56,961 - INFO - Finished converting document 4_2024-02-14 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2024-02-12' --> 'data\processed_data\LLY\4_2024-02-12.md'
Converted 'data\edgar_documents\LLY\4_2024-02-14' --> 'data\processed_data\LLY\4_2024-02-14.md'


2025-11-14 16:58:57,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:57,114 - INFO - Going to convert document batch...
2025-11-14 16:58:57,115 - INFO - Processing document 4_2024-02-16
2025-11-14 16:58:57,147 - INFO - Finished converting document 4_2024-02-16 in 0.09 sec.
2025-11-14 16:58:57,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:57,216 - INFO - Going to convert document batch...
2025-11-14 16:58:57,217 - INFO - Processing document 4_2024-02-20


Converted 'data\edgar_documents\LLY\4_2024-02-16' --> 'data\processed_data\LLY\4_2024-02-16.md'


2025-11-14 16:58:57,578 - INFO - Finished converting document 4_2024-02-20 in 0.41 sec.
2025-11-14 16:58:57,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:57,770 - INFO - Going to convert document batch...
2025-11-14 16:58:57,771 - INFO - Processing document 4_2024-02-21
2025-11-14 16:58:57,794 - INFO - Finished converting document 4_2024-02-21 in 0.08 sec.
2025-11-14 16:58:57,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:57,845 - INFO - Going to convert document batch...
2025-11-14 16:58:57,845 - INFO - Processing document 4_2024-03-11
2025-11-14 16:58:57,872 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.
2025-11-14 16:58:57,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2024-02-20' --> 'data\processed_data\LLY\4_2024-02-20.md'
Converted 'data\edgar_documents\LLY\4_2024-02-21' --> 'data\processed_data\LLY\4_2024-02-21.md'
Converted 'data\edgar_documents\LLY\4_2024-03-11' --> 'data\processed_data\LLY\4_2024-03-11.md'


2025-11-14 16:58:57,932 - INFO - Going to convert document batch...
2025-11-14 16:58:57,933 - INFO - Processing document 4_2024-03-19
2025-11-14 16:58:57,970 - INFO - Finished converting document 4_2024-03-19 in 0.08 sec.
2025-11-14 16:58:58,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,018 - INFO - Going to convert document batch...
2025-11-14 16:58:58,019 - INFO - Processing document 4_2024-04-16
2025-11-14 16:58:58,040 - INFO - Finished converting document 4_2024-04-16 in 0.03 sec.
2025-11-14 16:58:58,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,081 - INFO - Going to convert document batch...
2025-11-14 16:58:58,082 - INFO - Processing document 4_2024-05-21
2025-11-14 16:58:58,102 - INFO - Finished converting document 4_2024-05-21 in 0.03 sec.
2025-11-14 16:58:58,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,163 - INFO - Going to convert document batch...
2025-11-14 16:58:58,164 - 

Converted 'data\edgar_documents\LLY\4_2024-03-19' --> 'data\processed_data\LLY\4_2024-03-19.md'
Converted 'data\edgar_documents\LLY\4_2024-04-16' --> 'data\processed_data\LLY\4_2024-04-16.md'
Converted 'data\edgar_documents\LLY\4_2024-05-21' --> 'data\processed_data\LLY\4_2024-05-21.md'


2025-11-14 16:58:58,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,245 - INFO - Going to convert document batch...
2025-11-14 16:58:58,246 - INFO - Processing document 4_2024-05-23
2025-11-14 16:58:58,273 - INFO - Finished converting document 4_2024-05-23 in 0.05 sec.
2025-11-14 16:58:58,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,343 - INFO - Going to convert document batch...
2025-11-14 16:58:58,343 - INFO - Processing document 4_2024-05-24
2025-11-14 16:58:58,382 - INFO - Finished converting document 4_2024-05-24 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2024-05-22' --> 'data\processed_data\LLY\4_2024-05-22.md'
Converted 'data\edgar_documents\LLY\4_2024-05-23' --> 'data\processed_data\LLY\4_2024-05-23.md'


2025-11-14 16:58:58,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,444 - INFO - Going to convert document batch...
2025-11-14 16:58:58,445 - INFO - Processing document 4_2024-05-28
2025-11-14 16:58:58,551 - INFO - Finished converting document 4_2024-05-28 in 0.12 sec.


Converted 'data\edgar_documents\LLY\4_2024-05-24' --> 'data\processed_data\LLY\4_2024-05-24.md'
Converted 'data\edgar_documents\LLY\4_2024-05-28' --> 'data\processed_data\LLY\4_2024-05-28.md'


2025-11-14 16:58:58,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,664 - INFO - Going to convert document batch...
2025-11-14 16:58:58,665 - INFO - Processing document 4_2024-05-29
2025-11-14 16:58:58,694 - INFO - Finished converting document 4_2024-05-29 in 0.09 sec.
2025-11-14 16:58:58,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,774 - INFO - Going to convert document batch...
2025-11-14 16:58:58,776 - INFO - Processing document 4_2024-05-30
2025-11-14 16:58:58,806 - INFO - Finished converting document 4_2024-05-30 in 0.06 sec.
2025-11-14 16:58:58,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,861 - INFO - Going to convert document batch...
2025-11-14 16:58:58,863 - INFO - Processing document 4_2024-06-03
2025-11-14 16:58:58,896 - INFO - Finished converting document 4_2024-06-03 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2024-05-29' --> 'data\processed_data\LLY\4_2024-05-29.md'
Converted 'data\edgar_documents\LLY\4_2024-05-30' --> 'data\processed_data\LLY\4_2024-05-30.md'


2025-11-14 16:58:58,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:58,957 - INFO - Going to convert document batch...
2025-11-14 16:58:58,958 - INFO - Processing document 4_2024-06-04
2025-11-14 16:58:59,068 - INFO - Finished converting document 4_2024-06-04 in 0.14 sec.


Converted 'data\edgar_documents\LLY\4_2024-06-03' --> 'data\processed_data\LLY\4_2024-06-03.md'
Converted 'data\edgar_documents\LLY\4_2024-06-04' --> 'data\processed_data\LLY\4_2024-06-04.md'


2025-11-14 16:58:59,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,148 - INFO - Going to convert document batch...
2025-11-14 16:58:59,148 - INFO - Processing document 4_2024-06-06
2025-11-14 16:58:59,171 - INFO - Finished converting document 4_2024-06-06 in 0.08 sec.
2025-11-14 16:58:59,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,243 - INFO - Going to convert document batch...
2025-11-14 16:58:59,244 - INFO - Processing document 4_2024-06-07
2025-11-14 16:58:59,296 - INFO - Finished converting document 4_2024-06-07 in 0.09 sec.
2025-11-14 16:58:59,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,392 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2024-06-06' --> 'data\processed_data\LLY\4_2024-06-06.md'
Converted 'data\edgar_documents\LLY\4_2024-06-07' --> 'data\processed_data\LLY\4_2024-06-07.md'


2025-11-14 16:58:59,393 - INFO - Processing document 4_2024-06-10
2025-11-14 16:58:59,471 - INFO - Finished converting document 4_2024-06-10 in 0.14 sec.
2025-11-14 16:58:59,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,593 - INFO - Going to convert document batch...
2025-11-14 16:58:59,594 - INFO - Processing document 4_2024-06-11
2025-11-14 16:58:59,648 - INFO - Finished converting document 4_2024-06-11 in 0.09 sec.
2025-11-14 16:58:59,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,730 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2024-06-10' --> 'data\processed_data\LLY\4_2024-06-10.md'
Converted 'data\edgar_documents\LLY\4_2024-06-11' --> 'data\processed_data\LLY\4_2024-06-11.md'


2025-11-14 16:58:59,732 - INFO - Processing document 4_2024-06-17
2025-11-14 16:58:59,776 - INFO - Finished converting document 4_2024-06-17 in 0.09 sec.
2025-11-14 16:58:59,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,852 - INFO - Going to convert document batch...
2025-11-14 16:58:59,853 - INFO - Processing document 4_2024-06-18
2025-11-14 16:58:59,875 - INFO - Finished converting document 4_2024-06-18 in 0.06 sec.
2025-11-14 16:58:59,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,926 - INFO - Going to convert document batch...
2025-11-14 16:58:59,927 - INFO - Processing document 4_2024-06-21
2025-11-14 16:58:59,950 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.
2025-11-14 16:58:59,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:58:59,998 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2024-06-17' --> 'data\processed_data\LLY\4_2024-06-17.md'
Converted 'data\edgar_documents\LLY\4_2024-06-18' --> 'data\processed_data\LLY\4_2024-06-18.md'
Converted 'data\edgar_documents\LLY\4_2024-06-21' --> 'data\processed_data\LLY\4_2024-06-21.md'


2025-11-14 16:58:59,999 - INFO - Processing document 4_2024-06-25
2025-11-14 16:59:00,027 - INFO - Finished converting document 4_2024-06-25 in 0.06 sec.
2025-11-14 16:59:00,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,149 - INFO - Going to convert document batch...
2025-11-14 16:59:00,151 - INFO - Processing document 4_2024-06-26
2025-11-14 16:59:00,196 - INFO - Finished converting document 4_2024-06-26 in 0.08 sec.
2025-11-14 16:59:00,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,305 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2024-06-25' --> 'data\processed_data\LLY\4_2024-06-25.md'
Converted 'data\edgar_documents\LLY\4_2024-06-26' --> 'data\processed_data\LLY\4_2024-06-26.md'


2025-11-14 16:59:00,307 - INFO - Processing document 4_2024-07-01
2025-11-14 16:59:00,337 - INFO - Finished converting document 4_2024-07-01 in 0.09 sec.
2025-11-14 16:59:00,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,390 - INFO - Going to convert document batch...
2025-11-14 16:59:00,391 - INFO - Processing document 4_2024-07-02
2025-11-14 16:59:00,417 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 16:59:00,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,465 - INFO - Going to convert document batch...
2025-11-14 16:59:00,466 - INFO - Processing document 4_2024-07-03
2025-11-14 16:59:00,486 - INFO - Finished converting document 4_2024-07-03 in 0.05 sec.
2025-11-14 16:59:00,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,539 - INFO - Going to convert document batch...
2025-11-14 16:59:00,540 - INFO - Processing document 4_2024-07-08


Converted 'data\edgar_documents\LLY\4_2024-07-01' --> 'data\processed_data\LLY\4_2024-07-01.md'
Converted 'data\edgar_documents\LLY\4_2024-07-02' --> 'data\processed_data\LLY\4_2024-07-02.md'
Converted 'data\edgar_documents\LLY\4_2024-07-03' --> 'data\processed_data\LLY\4_2024-07-03.md'


2025-11-14 16:59:00,564 - INFO - Finished converting document 4_2024-07-08 in 0.05 sec.
2025-11-14 16:59:00,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,637 - INFO - Going to convert document batch...
2025-11-14 16:59:00,638 - INFO - Processing document 4_2024-07-09
2025-11-14 16:59:00,702 - INFO - Finished converting document 4_2024-07-09 in 0.11 sec.


Converted 'data\edgar_documents\LLY\4_2024-07-08' --> 'data\processed_data\LLY\4_2024-07-08.md'


2025-11-14 16:59:00,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:00,886 - INFO - Going to convert document batch...
2025-11-14 16:59:00,887 - INFO - Processing document 4_2024-07-11
2025-11-14 16:59:00,934 - INFO - Finished converting document 4_2024-07-11 in 0.11 sec.
2025-11-14 16:59:00,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2024-07-09' --> 'data\processed_data\LLY\4_2024-07-09.md'
Converted 'data\edgar_documents\LLY\4_2024-07-11' --> 'data\processed_data\LLY\4_2024-07-11.md'


2025-11-14 16:59:01,004 - INFO - Going to convert document batch...
2025-11-14 16:59:01,005 - INFO - Processing document 4_2024-07-16
2025-11-14 16:59:01,030 - INFO - Finished converting document 4_2024-07-16 in 0.06 sec.
2025-11-14 16:59:01,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,170 - INFO - Going to convert document batch...
2025-11-14 16:59:01,171 - INFO - Processing document 4_2024-08-02
2025-11-14 16:59:01,197 - INFO - Finished converting document 4_2024-08-02 in 0.08 sec.
2025-11-14 16:59:01,244 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:01,244 - ERROR - Input document 4_2024-08-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\LLY\4_2024-07-16' --> 'data\processed_data\LLY\4_2024-07-16.md'
Converted 'data\edgar_documents\LLY\4_2024-08-02' --> 'data\processed_data\LLY\4_2024-08-02.md'
Error processing data\edgar_documents\LLY\4_2024-08-12: File format not allowed: data\edgar_documents\LLY\4_2024-08-12
Error processing data\edgar_documents\LLY\4_2024-08-13: File format not allowed: data\edgar_documents\LLY\4_2024-08-13


2025-11-14 16:59:01,302 - INFO - Going to convert document batch...
2025-11-14 16:59:01,303 - INFO - Processing document 4_2024-08-20
2025-11-14 16:59:01,329 - INFO - Finished converting document 4_2024-08-20 in 0.06 sec.
2025-11-14 16:59:01,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,383 - INFO - Going to convert document batch...
2025-11-14 16:59:01,384 - INFO - Processing document 4_2024-08-21
2025-11-14 16:59:01,415 - INFO - Finished converting document 4_2024-08-21 in 0.05 sec.
2025-11-14 16:59:01,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,475 - INFO - Going to convert document batch...
2025-11-14 16:59:01,476 - INFO - Processing document 4_2024-08-23
2025-11-14 16:59:01,503 - INFO - Finished converting document 4_2024-08-23 in 0.05 sec.


Converted 'data\edgar_documents\LLY\4_2024-08-20' --> 'data\processed_data\LLY\4_2024-08-20.md'
Converted 'data\edgar_documents\LLY\4_2024-08-21' --> 'data\processed_data\LLY\4_2024-08-21.md'
Converted 'data\edgar_documents\LLY\4_2024-08-23' --> 'data\processed_data\LLY\4_2024-08-23.md'


2025-11-14 16:59:01,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,556 - INFO - Going to convert document batch...
2025-11-14 16:59:01,557 - INFO - Processing document 4_2024-08-26
2025-11-14 16:59:01,592 - INFO - Finished converting document 4_2024-08-26 in 0.06 sec.
2025-11-14 16:59:01,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,657 - INFO - Going to convert document batch...
2025-11-14 16:59:01,657 - INFO - Processing document 4_2024-08-28
2025-11-14 16:59:01,685 - INFO - Finished converting document 4_2024-08-28 in 0.06 sec.
2025-11-14 16:59:01,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,733 - INFO - Going to convert document batch...
2025-11-14 16:59:01,734 - INFO - Processing document 4_2024-09-04
2025-11-14 16:59:01,761 - INFO - Finished converting document 4_2024-09-04 in 0.06 sec.
2025-11-14 16:59:01,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\LLY\4_2024-08-26' --> 'data\processed_data\LLY\4_2024-08-26.md'
Converted 'data\edgar_documents\LLY\4_2024-08-28' --> 'data\processed_data\LLY\4_2024-08-28.md'
Converted 'data\edgar_documents\LLY\4_2024-09-04' --> 'data\processed_data\LLY\4_2024-09-04.md'


2025-11-14 16:59:01,810 - INFO - Processing document 4_2024-09-12
2025-11-14 16:59:01,844 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.
2025-11-14 16:59:01,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:01,928 - INFO - Going to convert document batch...
2025-11-14 16:59:01,930 - INFO - Processing document 4_2024-09-17
2025-11-14 16:59:01,969 - INFO - Finished converting document 4_2024-09-17 in 0.08 sec.
2025-11-14 16:59:02,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,028 - INFO - Going to convert document batch...
2025-11-14 16:59:02,029 - INFO - Processing document 4_2024-10-22
2025-11-14 16:59:02,051 - INFO - Finished converting document 4_2024-10-22 in 0.05 sec.


Converted 'data\edgar_documents\LLY\4_2024-09-12' --> 'data\processed_data\LLY\4_2024-09-12.md'
Converted 'data\edgar_documents\LLY\4_2024-09-17' --> 'data\processed_data\LLY\4_2024-09-17.md'


2025-11-14 16:59:02,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,099 - INFO - Going to convert document batch...
2025-11-14 16:59:02,100 - INFO - Processing document 4_2024-11-01
2025-11-14 16:59:02,137 - INFO - Finished converting document 4_2024-11-01 in 0.06 sec.
2025-11-14 16:59:02,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,199 - INFO - Going to convert document batch...
2025-11-14 16:59:02,200 - INFO - Processing document 4_2024-11-05
2025-11-14 16:59:02,225 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 16:59:02,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2024-10-22' --> 'data\processed_data\LLY\4_2024-10-22.md'
Converted 'data\edgar_documents\LLY\4_2024-11-01' --> 'data\processed_data\LLY\4_2024-11-01.md'
Converted 'data\edgar_documents\LLY\4_2024-11-05' --> 'data\processed_data\LLY\4_2024-11-05.md'


2025-11-14 16:59:02,272 - INFO - Going to convert document batch...
2025-11-14 16:59:02,273 - INFO - Processing document 4_2024-11-08
2025-11-14 16:59:02,295 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 16:59:02,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,344 - INFO - Going to convert document batch...
2025-11-14 16:59:02,344 - INFO - Processing document 4_2024-11-20
2025-11-14 16:59:02,364 - INFO - Finished converting document 4_2024-11-20 in 0.05 sec.
2025-11-14 16:59:02,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,410 - INFO - Going to convert document batch...
2025-11-14 16:59:02,411 - INFO - Processing document 4_2024-12-17
2025-11-14 16:59:02,441 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 16:59:02,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,496 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2024-11-08' --> 'data\processed_data\LLY\4_2024-11-08.md'
Converted 'data\edgar_documents\LLY\4_2024-11-20' --> 'data\processed_data\LLY\4_2024-11-20.md'
Converted 'data\edgar_documents\LLY\4_2024-12-17' --> 'data\processed_data\LLY\4_2024-12-17.md'


2025-11-14 16:59:02,497 - INFO - Processing document 4_2025-01-23
2025-11-14 16:59:02,530 - INFO - Finished converting document 4_2025-01-23 in 0.06 sec.
2025-11-14 16:59:02,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,583 - INFO - Going to convert document batch...
2025-11-14 16:59:02,584 - INFO - Processing document 4_2025-02-04
2025-11-14 16:59:02,624 - INFO - Finished converting document 4_2025-02-04 in 0.06 sec.
2025-11-14 16:59:02,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:02,700 - INFO - Going to convert document batch...
2025-11-14 16:59:02,702 - INFO - Processing document 4_2025-02-07
2025-11-14 16:59:02,748 - INFO - Finished converting document 4_2025-02-07 in 0.09 sec.


Converted 'data\edgar_documents\LLY\4_2025-01-23' --> 'data\processed_data\LLY\4_2025-01-23.md'
Converted 'data\edgar_documents\LLY\4_2025-02-04' --> 'data\processed_data\LLY\4_2025-02-04.md'


2025-11-14 16:59:02,820 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:02,821 - ERROR - Input document 4_2025-02-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:59:02,822 - INFO - Going to convert document batch...
2025-11-14 16:59:02,846 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:02,846 - ERROR - Input document 4_2025-02-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\LLY\4_2025-02-07' --> 'data\processed_data\LLY\4_2025-02-07.md'
Error processing data\edgar_documents\LLY\4_2025-02-10: File format not allowed: data\edgar_documents\LLY\4_2025-02-10
Error processing data\edgar_documents\LLY\4_2025-02-11: File format not allowed: data\edgar_documents\LLY\4_2025-02-11
Converted 'data\edgar_documents\LLY\4_2025-02-12' --> 'data\processed_data\LLY\4_2025-02-12.md'


2025-11-14 16:59:03,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:03,066 - INFO - Going to convert document batch...
2025-11-14 16:59:03,067 - INFO - Processing document 4_2025-02-19
2025-11-14 16:59:03,108 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 16:59:03,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:03,163 - INFO - Going to convert document batch...
2025-11-14 16:59:03,164 - INFO - Processing document 4_2025-02-20


Converted 'data\edgar_documents\LLY\4_2025-02-14' --> 'data\processed_data\LLY\4_2025-02-14.md'
Converted 'data\edgar_documents\LLY\4_2025-02-19' --> 'data\processed_data\LLY\4_2025-02-19.md'


2025-11-14 16:59:03,500 - INFO - Finished converting document 4_2025-02-20 in 0.36 sec.
2025-11-14 16:59:03,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:03,648 - INFO - Going to convert document batch...
2025-11-14 16:59:03,654 - INFO - Processing document 4_2025-02-21
2025-11-14 16:59:03,689 - INFO - Finished converting document 4_2025-02-21 in 0.14 sec.
2025-11-14 16:59:03,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2025-02-20' --> 'data\processed_data\LLY\4_2025-02-20.md'
Converted 'data\edgar_documents\LLY\4_2025-02-21' --> 'data\processed_data\LLY\4_2025-02-21.md'


2025-11-14 16:59:03,763 - INFO - Going to convert document batch...
2025-11-14 16:59:03,765 - INFO - Processing document 4_2025-02-24
2025-11-14 16:59:03,819 - INFO - Finished converting document 4_2025-02-24 in 0.11 sec.
2025-11-14 16:59:03,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:03,940 - INFO - Going to convert document batch...
2025-11-14 16:59:03,941 - INFO - Processing document 4_2025-02-25
2025-11-14 16:59:03,994 - INFO - Finished converting document 4_2025-02-25 in 0.14 sec.


Converted 'data\edgar_documents\LLY\4_2025-02-24' --> 'data\processed_data\LLY\4_2025-02-24.md'
Converted 'data\edgar_documents\LLY\4_2025-02-25' --> 'data\processed_data\LLY\4_2025-02-25.md'


2025-11-14 16:59:04,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,109 - INFO - Going to convert document batch...
2025-11-14 16:59:04,110 - INFO - Processing document 4_2025-02-26
2025-11-14 16:59:04,165 - INFO - Finished converting document 4_2025-02-26 in 0.12 sec.
2025-11-14 16:59:04,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,232 - INFO - Going to convert document batch...
2025-11-14 16:59:04,233 - INFO - Processing document 4_2025-03-03
2025-11-14 16:59:04,261 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.
2025-11-14 16:59:04,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,323 - INFO - Going to convert document batch...
2025-11-14 16:59:04,324 - INFO - Processing document 4_2025-03-04
2025-11-14 16:59:04,365 - INFO - Finished converting document 4_2025-03-04 in 0.08 sec.


Converted 'data\edgar_documents\LLY\4_2025-02-26' --> 'data\processed_data\LLY\4_2025-02-26.md'
Converted 'data\edgar_documents\LLY\4_2025-03-03' --> 'data\processed_data\LLY\4_2025-03-03.md'
Converted 'data\edgar_documents\LLY\4_2025-03-04' --> 'data\processed_data\LLY\4_2025-03-04.md'


2025-11-14 16:59:04,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,428 - INFO - Going to convert document batch...
2025-11-14 16:59:04,429 - INFO - Processing document 4_2025-03-13
2025-11-14 16:59:04,451 - INFO - Finished converting document 4_2025-03-13 in 0.06 sec.
2025-11-14 16:59:04,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,503 - INFO - Going to convert document batch...
2025-11-14 16:59:04,504 - INFO - Processing document 4_2025-03-19
2025-11-14 16:59:04,527 - INFO - Finished converting document 4_2025-03-19 in 0.05 sec.
2025-11-14 16:59:04,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2025-03-13' --> 'data\processed_data\LLY\4_2025-03-13.md'
Converted 'data\edgar_documents\LLY\4_2025-03-19' --> 'data\processed_data\LLY\4_2025-03-19.md'


2025-11-14 16:59:04,688 - INFO - Going to convert document batch...
2025-11-14 16:59:04,689 - INFO - Processing document 4_2025-04-22
2025-11-14 16:59:04,715 - INFO - Finished converting document 4_2025-04-22 in 0.09 sec.
2025-11-14 16:59:04,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,780 - INFO - Going to convert document batch...
2025-11-14 16:59:04,780 - INFO - Processing document 4_2025-05-05
2025-11-14 16:59:04,803 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 16:59:04,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,849 - INFO - Going to convert document batch...
2025-11-14 16:59:04,850 - INFO - Processing document 4_2025-05-15
2025-11-14 16:59:04,891 - INFO - Finished converting document 4_2025-05-15 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2025-04-22' --> 'data\processed_data\LLY\4_2025-04-22.md'
Converted 'data\edgar_documents\LLY\4_2025-05-05' --> 'data\processed_data\LLY\4_2025-05-05.md'
Converted 'data\edgar_documents\LLY\4_2025-05-15' --> 'data\processed_data\LLY\4_2025-05-15.md'


2025-11-14 16:59:04,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:04,941 - INFO - Going to convert document batch...
2025-11-14 16:59:04,942 - INFO - Processing document 4_2025-05-20
2025-11-14 16:59:04,964 - INFO - Finished converting document 4_2025-05-20 in 0.05 sec.
2025-11-14 16:59:05,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,019 - INFO - Going to convert document batch...
2025-11-14 16:59:05,020 - INFO - Processing document 4_2025-05-27
2025-11-14 16:59:05,041 - INFO - Finished converting document 4_2025-05-27 in 0.03 sec.
2025-11-14 16:59:05,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,084 - INFO - Going to convert document batch...
2025-11-14 16:59:05,085 - INFO - Processing document 4_2025-06-17
2025-11-14 16:59:05,106 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 16:59:05,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\LLY\4_2025-05-20' --> 'data\processed_data\LLY\4_2025-05-20.md'
Converted 'data\edgar_documents\LLY\4_2025-05-27' --> 'data\processed_data\LLY\4_2025-05-27.md'
Converted 'data\edgar_documents\LLY\4_2025-06-17' --> 'data\processed_data\LLY\4_2025-06-17.md'
Converted 'data\edgar_documents\LLY\4_2025-07-22' --> 'data\processed_data\LLY\4_2025-07-22.md'


2025-11-14 16:59:05,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,230 - INFO - Going to convert document batch...
2025-11-14 16:59:05,230 - INFO - Processing document 4_2025-07-25
2025-11-14 16:59:05,271 - INFO - Finished converting document 4_2025-07-25 in 0.08 sec.
2025-11-14 16:59:05,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,320 - INFO - Going to convert document batch...
2025-11-14 16:59:05,321 - INFO - Processing document 4_2025-08-04
2025-11-14 16:59:05,346 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.
2025-11-14 16:59:05,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,392 - INFO - Going to convert document batch...
2025-11-14 16:59:05,393 - INFO - Processing document 4_2025-08-08
2025-11-14 16:59:05,418 - INFO - Finished converting document 4_2025-08-08 in 0.05 sec.
2025-11-14 16:59:05,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:

Converted 'data\edgar_documents\LLY\4_2025-07-25' --> 'data\processed_data\LLY\4_2025-07-25.md'
Converted 'data\edgar_documents\LLY\4_2025-08-04' --> 'data\processed_data\LLY\4_2025-08-04.md'
Converted 'data\edgar_documents\LLY\4_2025-08-08' --> 'data\processed_data\LLY\4_2025-08-08.md'


2025-11-14 16:59:05,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,546 - INFO - Going to convert document batch...
2025-11-14 16:59:05,546 - INFO - Processing document 4_2025-08-13
2025-11-14 16:59:05,576 - INFO - Finished converting document 4_2025-08-13 in 0.06 sec.
2025-11-14 16:59:05,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:05,638 - INFO - Going to convert document batch...
2025-11-14 16:59:05,639 - INFO - Processing document 4_2025-08-14
2025-11-14 16:59:05,661 - INFO - Finished converting document 4_2025-08-14 in 0.05 sec.
2025-11-14 16:59:05,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\4_2025-08-12' --> 'data\processed_data\LLY\4_2025-08-12.md'
Converted 'data\edgar_documents\LLY\4_2025-08-13' --> 'data\processed_data\LLY\4_2025-08-13.md'
Converted 'data\edgar_documents\LLY\4_2025-08-14' --> 'data\processed_data\LLY\4_2025-08-14.md'


2025-11-14 16:59:05,711 - INFO - Going to convert document batch...
2025-11-14 16:59:05,712 - INFO - Processing document 4_2025-08-15
2025-11-14 16:59:05,731 - INFO - Finished converting document 4_2025-08-15 in 0.05 sec.
2025-11-14 16:59:05,781 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:05,782 - ERROR - Input document 4_2025-08-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:59:05,783 - INFO - Going to convert document batch...
2025-11-14 16:59:05,806 - IN

Converted 'data\edgar_documents\LLY\4_2025-08-15' --> 'data\processed_data\LLY\4_2025-08-15.md'
Error processing data\edgar_documents\LLY\4_2025-08-18: File format not allowed: data\edgar_documents\LLY\4_2025-08-18
Error processing data\edgar_documents\LLY\4_2025-08-19: File format not allowed: data\edgar_documents\LLY\4_2025-08-19
Converted 'data\edgar_documents\LLY\4_2025-08-28' --> 'data\processed_data\LLY\4_2025-08-28.md'


2025-11-14 16:59:05,948 - INFO - Finished converting document 4_2025-09-08 in 0.06 sec.
2025-11-14 16:59:06,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,122 - INFO - Going to convert document batch...
2025-11-14 16:59:06,123 - INFO - Processing document 4_2025-09-17
2025-11-14 16:59:06,145 - INFO - Finished converting document 4_2025-09-17 in 0.08 sec.
2025-11-14 16:59:06,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,192 - INFO - Going to convert document batch...
2025-11-14 16:59:06,194 - INFO - Processing document 4_2025-09-19
2025-11-14 16:59:06,223 - INFO - Finished converting document 4_2025-09-19 in 0.05 sec.


Converted 'data\edgar_documents\LLY\4_2025-09-08' --> 'data\processed_data\LLY\4_2025-09-08.md'
Converted 'data\edgar_documents\LLY\4_2025-09-17' --> 'data\processed_data\LLY\4_2025-09-17.md'


2025-11-14 16:59:06,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,270 - INFO - Going to convert document batch...
2025-11-14 16:59:06,271 - INFO - Processing document 4_2025-09-22
2025-11-14 16:59:06,297 - INFO - Finished converting document 4_2025-09-22 in 0.05 sec.
2025-11-14 16:59:06,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,362 - INFO - Going to convert document batch...
2025-11-14 16:59:06,362 - INFO - Processing document 4_2025-10-01
2025-11-14 16:59:06,388 - INFO - Finished converting document 4_2025-10-01 in 0.06 sec.
2025-11-14 16:59:06,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,448 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\4_2025-09-19' --> 'data\processed_data\LLY\4_2025-09-19.md'
Converted 'data\edgar_documents\LLY\4_2025-09-22' --> 'data\processed_data\LLY\4_2025-09-22.md'
Converted 'data\edgar_documents\LLY\4_2025-10-01' --> 'data\processed_data\LLY\4_2025-10-01.md'


2025-11-14 16:59:06,449 - INFO - Processing document 4_2025-10-02
2025-11-14 16:59:06,522 - INFO - Finished converting document 4_2025-10-02 in 0.11 sec.
2025-11-14 16:59:06,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,724 - INFO - Going to convert document batch...
2025-11-14 16:59:06,725 - INFO - Processing document 4_2025-10-03
2025-11-14 16:59:06,753 - INFO - Finished converting document 4_2025-10-03 in 0.09 sec.
2025-11-14 16:59:06,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,818 - INFO - Going to convert document batch...
2025-11-14 16:59:06,818 - INFO - Processing document 4_2025-10-06


Converted 'data\edgar_documents\LLY\4_2025-10-02' --> 'data\processed_data\LLY\4_2025-10-02.md'
Converted 'data\edgar_documents\LLY\4_2025-10-03' --> 'data\processed_data\LLY\4_2025-10-03.md'


2025-11-14 16:59:06,872 - INFO - Finished converting document 4_2025-10-06 in 0.09 sec.
2025-11-14 16:59:06,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:06,958 - INFO - Going to convert document batch...
2025-11-14 16:59:06,959 - INFO - Processing document 4_2025-10-07
2025-11-14 16:59:06,993 - INFO - Finished converting document 4_2025-10-07 in 0.06 sec.
2025-11-14 16:59:07,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,043 - INFO - Going to convert document batch...
2025-11-14 16:59:07,044 - INFO - Processing document 4_2025-10-08
2025-11-14 16:59:07,062 - INFO - Finished converting document 4_2025-10-08 in 0.05 sec.


Converted 'data\edgar_documents\LLY\4_2025-10-06' --> 'data\processed_data\LLY\4_2025-10-06.md'
Converted 'data\edgar_documents\LLY\4_2025-10-07' --> 'data\processed_data\LLY\4_2025-10-07.md'
Converted 'data\edgar_documents\LLY\4_2025-10-08' --> 'data\processed_data\LLY\4_2025-10-08.md'


2025-11-14 16:59:07,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,127 - INFO - Going to convert document batch...
2025-11-14 16:59:07,128 - INFO - Processing document 4_2025-10-09
2025-11-14 16:59:07,172 - INFO - Finished converting document 4_2025-10-09 in 0.09 sec.
2025-11-14 16:59:07,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,274 - INFO - Going to convert document batch...
2025-11-14 16:59:07,275 - INFO - Processing document 4_2025-10-10
2025-11-14 16:59:07,306 - INFO - Finished converting document 4_2025-10-10 in 0.09 sec.
2025-11-14 16:59:07,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,358 - INFO - Going to convert document batch...
2025-11-14 16:59:07,359 - INFO - Processing document 4_2025-10-14
2025-11-14 16:59:07,381 - INFO - Finished converting document 4_2025-10-14 in 0.05 sec.


Converted 'data\edgar_documents\LLY\4_2025-10-09' --> 'data\processed_data\LLY\4_2025-10-09.md'
Converted 'data\edgar_documents\LLY\4_2025-10-10' --> 'data\processed_data\LLY\4_2025-10-10.md'
Converted 'data\edgar_documents\LLY\4_2025-10-14' --> 'data\processed_data\LLY\4_2025-10-14.md'


2025-11-14 16:59:07,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,427 - INFO - Going to convert document batch...
2025-11-14 16:59:07,428 - INFO - Processing document 4_2025-10-22
2025-11-14 16:59:07,448 - INFO - Finished converting document 4_2025-10-22 in 0.05 sec.
2025-11-14 16:59:07,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,624 - INFO - Going to convert document batch...
2025-11-14 16:59:07,625 - INFO - Processing document 4_2025-11-03
2025-11-14 16:59:07,656 - INFO - Finished converting document 4_2025-11-03 in 0.06 sec.
2025-11-14 16:59:07,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,761 - INFO - Going to convert document batch...
2025-11-14 16:59:07,762 - INFO - Processing document 4_2025-11-04


Converted 'data\edgar_documents\LLY\4_2025-10-22' --> 'data\processed_data\LLY\4_2025-10-22.md'
Converted 'data\edgar_documents\LLY\4_2025-11-03' --> 'data\processed_data\LLY\4_2025-11-03.md'


2025-11-14 16:59:07,820 - INFO - Finished converting document 4_2025-11-04 in 0.12 sec.
2025-11-14 16:59:07,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,912 - INFO - Going to convert document batch...
2025-11-14 16:59:07,913 - INFO - Processing document 4_2025-11-05
2025-11-14 16:59:07,949 - INFO - Finished converting document 4_2025-11-05 in 0.08 sec.
2025-11-14 16:59:07,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:07,998 - INFO - Going to convert document batch...
2025-11-14 16:59:07,999 - INFO - Processing document 4_2025-11-06
2025-11-14 16:59:08,033 - INFO - Finished converting document 4_2025-11-06 in 0.06 sec.


Converted 'data\edgar_documents\LLY\4_2025-11-04' --> 'data\processed_data\LLY\4_2025-11-04.md'
Converted 'data\edgar_documents\LLY\4_2025-11-05' --> 'data\processed_data\LLY\4_2025-11-05.md'


2025-11-14 16:59:08,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:08,089 - INFO - Going to convert document batch...
2025-11-14 16:59:08,090 - INFO - Processing document 4_2025-11-10
2025-11-14 16:59:08,137 - INFO - Finished converting document 4_2025-11-10 in 0.08 sec.
2025-11-14 16:59:08,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:08,211 - INFO - Going to convert document batch...
2025-11-14 16:59:08,212 - INFO - Processing document 8-K_2023-02-02


Converted 'data\edgar_documents\LLY\4_2025-11-06' --> 'data\processed_data\LLY\4_2025-11-06.md'
Converted 'data\edgar_documents\LLY\4_2025-11-10' --> 'data\processed_data\LLY\4_2025-11-10.md'


2025-11-14 16:59:08,322 - INFO - Finished converting document 8-K_2023-02-02 in 0.16 sec.
2025-11-14 16:59:08,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:08,437 - INFO - Going to convert document batch...
2025-11-14 16:59:08,438 - INFO - Processing document 8-K_2023-02-24


Converted 'data\edgar_documents\LLY\8-K_2023-02-02' --> 'data\processed_data\LLY\8-K_2023-02-02.md'


2025-11-14 16:59:08,774 - INFO - Finished converting document 8-K_2023-02-24 in 0.41 sec.
2025-11-14 16:59:08,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:08,953 - INFO - Going to convert document batch...
2025-11-14 16:59:08,954 - INFO - Processing document 8-K_2023-03-17
2025-11-14 16:59:08,989 - INFO - Finished converting document 8-K_2023-03-17 in 0.19 sec.


Converted 'data\edgar_documents\LLY\8-K_2023-02-24' --> 'data\processed_data\LLY\8-K_2023-02-24.md'


2025-11-14 16:59:09,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,078 - INFO - Going to convert document batch...
2025-11-14 16:59:09,080 - INFO - Processing document 8-K_2023-04-27
2025-11-14 16:59:09,131 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 16:59:09,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,219 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\8-K_2023-03-17' --> 'data\processed_data\LLY\8-K_2023-03-17.md'
Converted 'data\edgar_documents\LLY\8-K_2023-04-27' --> 'data\processed_data\LLY\8-K_2023-04-27.md'


2025-11-14 16:59:09,219 - INFO - Processing document 8-K_2023-05-04
2025-11-14 16:59:09,288 - INFO - Finished converting document 8-K_2023-05-04 in 0.14 sec.
2025-11-14 16:59:09,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,413 - INFO - Going to convert document batch...
2025-11-14 16:59:09,414 - INFO - Processing document 8-K_2023-08-08
2025-11-14 16:59:09,456 - INFO - Finished converting document 8-K_2023-08-08 in 0.14 sec.


Converted 'data\edgar_documents\LLY\8-K_2023-05-04' --> 'data\processed_data\LLY\8-K_2023-05-04.md'
Converted 'data\edgar_documents\LLY\8-K_2023-08-08' --> 'data\processed_data\LLY\8-K_2023-08-08.md'


2025-11-14 16:59:09,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,545 - INFO - Going to convert document batch...
2025-11-14 16:59:09,546 - INFO - Processing document 8-K_2023-11-02
2025-11-14 16:59:09,616 - INFO - Finished converting document 8-K_2023-11-02 in 0.14 sec.
2025-11-14 16:59:09,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,704 - INFO - Going to convert document batch...
2025-11-14 16:59:09,705 - INFO - Processing document 8-K_2024-02-06
2025-11-14 16:59:09,750 - INFO - Finished converting document 8-K_2024-02-06 in 0.11 sec.
2025-11-14 16:59:09,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,812 - INFO - Going to convert document batch...
2025-11-14 16:59:09,814 - INFO - Processing document 8-K_2024-02-09


Converted 'data\edgar_documents\LLY\8-K_2023-11-02' --> 'data\processed_data\LLY\8-K_2023-11-02.md'
Converted 'data\edgar_documents\LLY\8-K_2024-02-06' --> 'data\processed_data\LLY\8-K_2024-02-06.md'


2025-11-14 16:59:09,852 - INFO - Finished converting document 8-K_2024-02-09 in 0.08 sec.
2025-11-14 16:59:09,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:09,925 - INFO - Going to convert document batch...
2025-11-14 16:59:09,925 - INFO - Processing document 8-K_2024-04-30
2025-11-14 16:59:09,989 - INFO - Finished converting document 8-K_2024-04-30 in 0.11 sec.
2025-11-14 16:59:10,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\8-K_2024-02-09' --> 'data\processed_data\LLY\8-K_2024-02-09.md'
Converted 'data\edgar_documents\LLY\8-K_2024-04-30' --> 'data\processed_data\LLY\8-K_2024-04-30.md'


2025-11-14 16:59:10,106 - INFO - Going to convert document batch...
2025-11-14 16:59:10,107 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:59:10,184 - INFO - Finished converting document 8-K_2024-05-09 in 0.19 sec.
2025-11-14 16:59:10,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,303 - INFO - Going to convert document batch...
2025-11-14 16:59:10,304 - INFO - Processing document 8-K_2024-06-05
2025-11-14 16:59:10,339 - INFO - Finished converting document 8-K_2024-06-05 in 0.12 sec.
2025-11-14 16:59:10,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,392 - INFO - Going to convert document batch...
2025-11-14 16:59:10,393 - INFO - Processing document 8-K_2024-07-10


Converted 'data\edgar_documents\LLY\8-K_2024-05-09' --> 'data\processed_data\LLY\8-K_2024-05-09.md'
Converted 'data\edgar_documents\LLY\8-K_2024-06-05' --> 'data\processed_data\LLY\8-K_2024-06-05.md'


2025-11-14 16:59:10,436 - INFO - Finished converting document 8-K_2024-07-10 in 0.08 sec.
2025-11-14 16:59:10,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,497 - INFO - Going to convert document batch...
2025-11-14 16:59:10,499 - INFO - Processing document 8-K_2024-08-08
2025-11-14 16:59:10,544 - INFO - Finished converting document 8-K_2024-08-08 in 0.09 sec.
2025-11-14 16:59:10,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,600 - INFO - Going to convert document batch...
2025-11-14 16:59:10,601 - INFO - Processing document 8-K_2024-08-14
2025-11-14 16:59:10,635 - INFO - Finished converting document 8-K_2024-08-14 in 0.08 sec.


Converted 'data\edgar_documents\LLY\8-K_2024-07-10' --> 'data\processed_data\LLY\8-K_2024-07-10.md'
Converted 'data\edgar_documents\LLY\8-K_2024-08-08' --> 'data\processed_data\LLY\8-K_2024-08-08.md'


2025-11-14 16:59:10,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,699 - INFO - Going to convert document batch...
2025-11-14 16:59:10,702 - INFO - Processing document 8-K_2024-08-16
2025-11-14 16:59:10,748 - INFO - Finished converting document 8-K_2024-08-16 in 0.09 sec.
2025-11-14 16:59:10,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,852 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\8-K_2024-08-14' --> 'data\processed_data\LLY\8-K_2024-08-14.md'
Converted 'data\edgar_documents\LLY\8-K_2024-08-16' --> 'data\processed_data\LLY\8-K_2024-08-16.md'


2025-11-14 16:59:10,853 - INFO - Processing document 8-K_2024-09-09
2025-11-14 16:59:10,893 - INFO - Finished converting document 8-K_2024-09-09 in 0.12 sec.
2025-11-14 16:59:10,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:10,982 - INFO - Going to convert document batch...
2025-11-14 16:59:10,983 - INFO - Processing document 8-K_2024-10-30
2025-11-14 16:59:11,035 - INFO - Finished converting document 8-K_2024-10-30 in 0.11 sec.
2025-11-14 16:59:11,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:11,106 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\8-K_2024-09-09' --> 'data\processed_data\LLY\8-K_2024-09-09.md'
Converted 'data\edgar_documents\LLY\8-K_2024-10-30' --> 'data\processed_data\LLY\8-K_2024-10-30.md'


2025-11-14 16:59:11,107 - INFO - Processing document 8-K_2024-11-19
2025-11-14 16:59:11,158 - INFO - Finished converting document 8-K_2024-11-19 in 0.11 sec.
2025-11-14 16:59:11,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:11,266 - INFO - Going to convert document batch...
2025-11-14 16:59:11,267 - INFO - Processing document 8-K_2025-01-14
2025-11-14 16:59:11,311 - INFO - Finished converting document 8-K_2025-01-14 in 0.12 sec.
2025-11-14 16:59:11,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\8-K_2024-11-19' --> 'data\processed_data\LLY\8-K_2024-11-19.md'
Converted 'data\edgar_documents\LLY\8-K_2025-01-14' --> 'data\processed_data\LLY\8-K_2025-01-14.md'


2025-11-14 16:59:11,418 - INFO - Going to convert document batch...
2025-11-14 16:59:11,419 - INFO - Processing document 8-K_2025-02-06
2025-11-14 16:59:11,485 - INFO - Finished converting document 8-K_2025-02-06 in 0.16 sec.
2025-11-14 16:59:11,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:11,568 - INFO - Going to convert document batch...
2025-11-14 16:59:11,569 - INFO - Processing document 8-K_2025-02-12
2025-11-14 16:59:11,599 - INFO - Finished converting document 8-K_2025-02-12 in 0.09 sec.
2025-11-14 16:59:11,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\8-K_2025-02-06' --> 'data\processed_data\LLY\8-K_2025-02-06.md'
Converted 'data\edgar_documents\LLY\8-K_2025-02-12' --> 'data\processed_data\LLY\8-K_2025-02-12.md'


2025-11-14 16:59:11,726 - INFO - Going to convert document batch...
2025-11-14 16:59:11,728 - INFO - Processing document 8-K_2025-05-01
2025-11-14 16:59:11,783 - INFO - Finished converting document 8-K_2025-05-01 in 0.17 sec.
2025-11-14 16:59:11,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:11,904 - INFO - Going to convert document batch...
2025-11-14 16:59:11,906 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:59:11,949 - INFO - Finished converting document 8-K_2025-05-08 in 0.11 sec.
2025-11-14 16:59:11,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:12,005 - INFO - Going to convert document batch...
2025-11-14 16:59:12,006 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:59:12,044 - INFO - Finished converting document 8-K_2025-08-07 in 0.08 sec.


Converted 'data\edgar_documents\LLY\8-K_2025-05-01' --> 'data\processed_data\LLY\8-K_2025-05-01.md'
Converted 'data\edgar_documents\LLY\8-K_2025-05-08' --> 'data\processed_data\LLY\8-K_2025-05-08.md'


2025-11-14 16:59:12,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:12,113 - INFO - Going to convert document batch...
2025-11-14 16:59:12,114 - INFO - Processing document 8-K_2025-08-20
2025-11-14 16:59:12,157 - INFO - Finished converting document 8-K_2025-08-20 in 0.09 sec.
2025-11-14 16:59:12,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:12,248 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LLY\8-K_2025-08-07' --> 'data\processed_data\LLY\8-K_2025-08-07.md'
Converted 'data\edgar_documents\LLY\8-K_2025-08-20' --> 'data\processed_data\LLY\8-K_2025-08-20.md'


2025-11-14 16:59:12,250 - INFO - Processing document 8-K_2025-10-30
2025-11-14 16:59:12,285 - INFO - Finished converting document 8-K_2025-10-30 in 0.11 sec.
2025-11-14 16:59:12,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\8-K_2025-10-30' --> 'data\processed_data\LLY\8-K_2025-10-30.md'


2025-11-14 16:59:13,201 - INFO - Going to convert document batch...
2025-11-14 16:59:13,202 - INFO - Processing document DEF-14A_2023-03-17
2025-11-14 16:59:15,767 - INFO - Finished converting document DEF-14A_2023-03-17 in 3.45 sec.
2025-11-14 16:59:16,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\DEF-14A_2023-03-17' --> 'data\processed_data\LLY\DEF-14A_2023-03-17.md'


2025-11-14 16:59:17,548 - INFO - Going to convert document batch...
2025-11-14 16:59:17,549 - INFO - Processing document DEF-14A_2024-03-22
2025-11-14 16:59:20,719 - INFO - Finished converting document DEF-14A_2024-03-22 in 4.06 sec.
2025-11-14 16:59:22,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\DEF-14A_2024-03-22' --> 'data\processed_data\LLY\DEF-14A_2024-03-22.md'


2025-11-14 16:59:22,785 - INFO - Going to convert document batch...
2025-11-14 16:59:22,786 - INFO - Processing document DEF-14A_2025-03-21
2025-11-14 16:59:26,410 - INFO - Finished converting document DEF-14A_2025-03-21 in 4.28 sec.
2025-11-14 16:59:27,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LLY\DEF-14A_2025-03-21' --> 'data\processed_data\LLY\DEF-14A_2025-03-21.md'
Processed 206 new files. Errors: 10
Found 94 files to process in data\edgar_documents\LMT


2025-11-14 16:59:28,890 - INFO - Going to convert document batch...
2025-11-14 16:59:28,891 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:59:28,892 - INFO - Processing document 10-K_2023-01-26
2025-11-14 16:59:31,580 - INFO - Finished converting document 10-K_2023-01-26 in 4.05 sec.
2025-11-14 16:59:32,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-K_2023-01-26' --> 'data\processed_data\LMT\10-K_2023-01-26.md'


2025-11-14 16:59:33,546 - INFO - Going to convert document batch...
2025-11-14 16:59:33,547 - INFO - Processing document 10-K_2024-01-23
2025-11-14 16:59:35,548 - INFO - Finished converting document 10-K_2024-01-23 in 2.98 sec.
2025-11-14 16:59:36,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-K_2024-01-23' --> 'data\processed_data\LMT\10-K_2024-01-23.md'


2025-11-14 16:59:37,315 - INFO - Going to convert document batch...
2025-11-14 16:59:37,316 - INFO - Processing document 10-K_2025-01-28
2025-11-14 16:59:39,258 - INFO - Finished converting document 10-K_2025-01-28 in 3.11 sec.
2025-11-14 16:59:39,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-K_2025-01-28' --> 'data\processed_data\LMT\10-K_2025-01-28.md'


2025-11-14 16:59:40,809 - INFO - Going to convert document batch...
2025-11-14 16:59:40,810 - INFO - Processing document 10-Q_2023-04-18
2025-11-14 16:59:41,584 - INFO - Finished converting document 10-Q_2023-04-18 in 1.73 sec.
2025-11-14 16:59:42,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2023-04-18' --> 'data\processed_data\LMT\10-Q_2023-04-18.md'


2025-11-14 16:59:42,599 - INFO - Going to convert document batch...
2025-11-14 16:59:42,600 - INFO - Processing document 10-Q_2023-07-19
2025-11-14 16:59:43,428 - INFO - Finished converting document 10-Q_2023-07-19 in 1.47 sec.
2025-11-14 16:59:43,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2023-07-19' --> 'data\processed_data\LMT\10-Q_2023-07-19.md'


2025-11-14 16:59:44,717 - INFO - Going to convert document batch...
2025-11-14 16:59:44,718 - INFO - Processing document 10-Q_2023-10-17
2025-11-14 16:59:45,547 - INFO - Finished converting document 10-Q_2023-10-17 in 1.72 sec.
2025-11-14 16:59:46,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2023-10-17' --> 'data\processed_data\LMT\10-Q_2023-10-17.md'


2025-11-14 16:59:46,465 - INFO - Going to convert document batch...
2025-11-14 16:59:46,466 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 16:59:47,130 - INFO - Finished converting document 10-Q_2024-04-23 in 1.09 sec.
2025-11-14 16:59:47,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2024-04-23' --> 'data\processed_data\LMT\10-Q_2024-04-23.md'


2025-11-14 16:59:48,205 - INFO - Going to convert document batch...
2025-11-14 16:59:48,206 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 16:59:49,010 - INFO - Finished converting document 10-Q_2024-07-23 in 1.58 sec.
2025-11-14 16:59:49,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2024-07-23' --> 'data\processed_data\LMT\10-Q_2024-07-23.md'


2025-11-14 16:59:50,307 - INFO - Going to convert document batch...
2025-11-14 16:59:50,307 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 16:59:51,227 - INFO - Finished converting document 10-Q_2024-10-22 in 1.86 sec.
2025-11-14 16:59:51,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2024-10-22' --> 'data\processed_data\LMT\10-Q_2024-10-22.md'


2025-11-14 16:59:52,031 - INFO - Going to convert document batch...
2025-11-14 16:59:52,032 - INFO - Processing document 10-Q_2025-04-22
2025-11-14 16:59:52,860 - INFO - Finished converting document 10-Q_2025-04-22 in 1.25 sec.
2025-11-14 16:59:53,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2025-04-22' --> 'data\processed_data\LMT\10-Q_2025-04-22.md'


2025-11-14 16:59:54,181 - INFO - Going to convert document batch...
2025-11-14 16:59:54,183 - INFO - Processing document 10-Q_2025-07-22
2025-11-14 16:59:55,013 - INFO - Finished converting document 10-Q_2025-07-22 in 1.83 sec.
2025-11-14 16:59:55,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\10-Q_2025-07-22' --> 'data\processed_data\LMT\10-Q_2025-07-22.md'


2025-11-14 16:59:56,044 - INFO - Going to convert document batch...
2025-11-14 16:59:56,046 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 16:59:57,087 - INFO - Finished converting document 10-Q_2025-10-21 in 1.69 sec.
2025-11-14 16:59:57,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:57,673 - INFO - Going to convert document batch...
2025-11-14 16:59:57,674 - INFO - Processing document 4_2023-01-04
2025-11-14 16:59:57,699 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 16:59:57,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:57,746 - INFO - Going to convert document batch...
2025-11-14 16:59:57,747 - INFO - Processing document 4_2023-01-26


Converted 'data\edgar_documents\LMT\10-Q_2025-10-21' --> 'data\processed_data\LMT\10-Q_2025-10-21.md'
Converted 'data\edgar_documents\LMT\4_2023-01-04' --> 'data\processed_data\LMT\4_2023-01-04.md'


2025-11-14 16:59:58,205 - INFO - Finished converting document 4_2023-01-26 in 0.48 sec.
2025-11-14 16:59:58,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,276 - INFO - Going to convert document batch...
2025-11-14 16:59:58,276 - INFO - Processing document 4_2023-02-17
2025-11-14 16:59:58,307 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 16:59:58,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,352 - INFO - Going to convert document batch...
2025-11-14 16:59:58,353 - INFO - Processing document 4_2023-02-24
2025-11-14 16:59:58,374 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 16:59:58,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,421 - INFO - Going to convert document batch...
2025-11-14 16:59:58,422 - INFO - Processing document 4_2023-02-27


Converted 'data\edgar_documents\LMT\4_2023-01-26' --> 'data\processed_data\LMT\4_2023-01-26.md'
Converted 'data\edgar_documents\LMT\4_2023-02-17' --> 'data\processed_data\LMT\4_2023-02-17.md'
Converted 'data\edgar_documents\LMT\4_2023-02-24' --> 'data\processed_data\LMT\4_2023-02-24.md'


2025-11-14 16:59:58,448 - INFO - Finished converting document 4_2023-02-27 in 0.06 sec.
2025-11-14 16:59:58,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,507 - INFO - Going to convert document batch...
2025-11-14 16:59:58,509 - INFO - Processing document 4_2023-03-01
2025-11-14 16:59:58,536 - INFO - Finished converting document 4_2023-03-01 in 0.06 sec.
2025-11-14 16:59:58,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,583 - INFO - Going to convert document batch...
2025-11-14 16:59:58,584 - INFO - Processing document 4_2023-03-03
2025-11-14 16:59:58,614 - INFO - Finished converting document 4_2023-03-03 in 0.05 sec.
2025-11-14 16:59:58,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2023-02-27' --> 'data\processed_data\LMT\4_2023-02-27.md'
Converted 'data\edgar_documents\LMT\4_2023-03-01' --> 'data\processed_data\LMT\4_2023-03-01.md'
Converted 'data\edgar_documents\LMT\4_2023-03-03' --> 'data\processed_data\LMT\4_2023-03-03.md'


2025-11-14 16:59:58,679 - INFO - Going to convert document batch...
2025-11-14 16:59:58,680 - INFO - Processing document 4_2023-03-07
2025-11-14 16:59:58,721 - INFO - Finished converting document 4_2023-03-07 in 0.08 sec.
2025-11-14 16:59:58,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,767 - INFO - Going to convert document batch...
2025-11-14 16:59:58,768 - INFO - Processing document 4_2023-04-04
2025-11-14 16:59:58,792 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 16:59:58,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,855 - INFO - Going to convert document batch...
2025-11-14 16:59:58,856 - INFO - Processing document 4_2023-04-20
2025-11-14 16:59:58,876 - INFO - Finished converting document 4_2023-04-20 in 0.06 sec.


Converted 'data\edgar_documents\LMT\4_2023-03-07' --> 'data\processed_data\LMT\4_2023-03-07.md'
Converted 'data\edgar_documents\LMT\4_2023-04-04' --> 'data\processed_data\LMT\4_2023-04-04.md'
Converted 'data\edgar_documents\LMT\4_2023-04-20' --> 'data\processed_data\LMT\4_2023-04-20.md'


2025-11-14 16:59:58,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:58,956 - INFO - Going to convert document batch...
2025-11-14 16:59:58,957 - INFO - Processing document 4_2023-04-21
2025-11-14 16:59:58,991 - INFO - Finished converting document 4_2023-04-21 in 0.06 sec.
2025-11-14 16:59:59,151 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:59,152 - ERROR - Input document 4_2023-05-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:59

Converted 'data\edgar_documents\LMT\4_2023-04-21' --> 'data\processed_data\LMT\4_2023-04-21.md'
Error processing data\edgar_documents\LMT\4_2023-05-23: File format not allowed: data\edgar_documents\LMT\4_2023-05-23
Error processing data\edgar_documents\LMT\4_2023-05-24: File format not allowed: data\edgar_documents\LMT\4_2023-05-24
Converted 'data\edgar_documents\LMT\4_2023-07-05' --> 'data\processed_data\LMT\4_2023-07-05.md'


2025-11-14 16:59:59,284 - INFO - Processing document 4_2023-07-19
2025-11-14 16:59:59,304 - INFO - Finished converting document 4_2023-07-19 in 0.05 sec.
2025-11-14 16:59:59,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:59,361 - INFO - Going to convert document batch...
2025-11-14 16:59:59,362 - INFO - Processing document 4_2023-07-31
2025-11-14 16:59:59,395 - INFO - Finished converting document 4_2023-07-31 in 0.06 sec.
2025-11-14 16:59:59,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:59,457 - INFO - Going to convert document batch...
2025-11-14 16:59:59,457 - INFO - Processing document 4_2023-10-03
2025-11-14 16:59:59,481 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 16:59:59,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2023-07-19' --> 'data\processed_data\LMT\4_2023-07-19.md'
Converted 'data\edgar_documents\LMT\4_2023-07-31' --> 'data\processed_data\LMT\4_2023-07-31.md'
Converted 'data\edgar_documents\LMT\4_2023-10-03' --> 'data\processed_data\LMT\4_2023-10-03.md'


2025-11-14 16:59:59,535 - INFO - Going to convert document batch...
2025-11-14 16:59:59,535 - INFO - Processing document 4_2023-12-12
2025-11-14 16:59:59,581 - INFO - Finished converting document 4_2023-12-12 in 0.08 sec.
2025-11-14 16:59:59,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:59,722 - INFO - Going to convert document batch...
2025-11-14 16:59:59,723 - INFO - Processing document 4_2024-01-03
2025-11-14 16:59:59,747 - INFO - Finished converting document 4_2024-01-03 in 0.06 sec.
2025-11-14 16:59:59,797 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:59:59,799 - ERROR - Input document 4_2024-01-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\LMT\4_2023-12-12' --> 'data\processed_data\LMT\4_2023-12-12.md'
Converted 'data\edgar_documents\LMT\4_2024-01-03' --> 'data\processed_data\LMT\4_2024-01-03.md'
Error processing data\edgar_documents\LMT\4_2024-01-25: File format not allowed: data\edgar_documents\LMT\4_2024-01-25
Error processing data\edgar_documents\LMT\4_2024-01-26: File format not allowed: data\edgar_documents\LMT\4_2024-01-26


2025-11-14 16:59:59,876 - INFO - Processing document 4_2024-02-20
2025-11-14 16:59:59,911 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 16:59:59,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:59:59,961 - INFO - Going to convert document batch...
2025-11-14 16:59:59,962 - INFO - Processing document 4_2024-02-26
2025-11-14 16:59:59,984 - INFO - Finished converting document 4_2024-02-26 in 0.05 sec.
2025-11-14 17:00:00,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,037 - INFO - Going to convert document batch...
2025-11-14 17:00:00,038 - INFO - Processing document 4_2024-02-27
2025-11-14 17:00:00,064 - INFO - Finished converting document 4_2024-02-27 in 0.06 sec.
2025-11-14 17:00:00,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,108 - INFO - Going to convert document batch...
2025-11-14 17:00:00,109 - INFO - Processing document 4_2024-03-05


Converted 'data\edgar_documents\LMT\4_2024-02-20' --> 'data\processed_data\LMT\4_2024-02-20.md'
Converted 'data\edgar_documents\LMT\4_2024-02-26' --> 'data\processed_data\LMT\4_2024-02-26.md'
Converted 'data\edgar_documents\LMT\4_2024-02-27' --> 'data\processed_data\LMT\4_2024-02-27.md'


2025-11-14 17:00:00,132 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:00:00,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,183 - INFO - Going to convert document batch...
2025-11-14 17:00:00,184 - INFO - Processing document 4_2024-03-07
2025-11-14 17:00:00,216 - INFO - Finished converting document 4_2024-03-07 in 0.06 sec.
2025-11-14 17:00:00,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,278 - INFO - Going to convert document batch...
2025-11-14 17:00:00,278 - INFO - Processing document 4_2024-04-02
2025-11-14 17:00:00,300 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 17:00:00,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,345 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LMT\4_2024-03-05' --> 'data\processed_data\LMT\4_2024-03-05.md'
Converted 'data\edgar_documents\LMT\4_2024-03-07' --> 'data\processed_data\LMT\4_2024-03-07.md'
Converted 'data\edgar_documents\LMT\4_2024-04-02' --> 'data\processed_data\LMT\4_2024-04-02.md'


2025-11-14 17:00:00,345 - INFO - Processing document 4_2024-04-03
2025-11-14 17:00:00,374 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 17:00:00,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,426 - INFO - Going to convert document batch...
2025-11-14 17:00:00,426 - INFO - Processing document 4_2024-04-29
2025-11-14 17:00:00,451 - INFO - Finished converting document 4_2024-04-29 in 0.05 sec.
2025-11-14 17:00:00,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,498 - INFO - Going to convert document batch...
2025-11-14 17:00:00,499 - INFO - Processing document 4_2024-06-05
2025-11-14 17:00:00,530 - INFO - Finished converting document 4_2024-06-05 in 0.06 sec.
2025-11-14 17:00:00,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,579 - INFO - Going to convert document batch...
2025-11-14 17:00:00,580 - INFO - Processing document 4_2024-07-02


Converted 'data\edgar_documents\LMT\4_2024-04-03' --> 'data\processed_data\LMT\4_2024-04-03.md'
Converted 'data\edgar_documents\LMT\4_2024-04-29' --> 'data\processed_data\LMT\4_2024-04-29.md'
Converted 'data\edgar_documents\LMT\4_2024-06-05' --> 'data\processed_data\LMT\4_2024-06-05.md'


2025-11-14 17:00:00,608 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 17:00:00,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,681 - INFO - Going to convert document batch...
2025-11-14 17:00:00,720 - INFO - Processing document 4_2024-07-25
2025-11-14 17:00:00,800 - INFO - Finished converting document 4_2024-07-25 in 0.16 sec.


Converted 'data\edgar_documents\LMT\4_2024-07-02' --> 'data\processed_data\LMT\4_2024-07-02.md'


2025-11-14 17:00:00,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,858 - INFO - Going to convert document batch...
2025-11-14 17:00:00,859 - INFO - Processing document 4_2024-08-05
2025-11-14 17:00:00,900 - INFO - Finished converting document 4_2024-08-05 in 0.06 sec.
2025-11-14 17:00:00,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:00,969 - INFO - Going to convert document batch...
2025-11-14 17:00:00,970 - INFO - Processing document 4_2024-10-02
2025-11-14 17:00:00,994 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:00:01,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2024-07-25' --> 'data\processed_data\LMT\4_2024-07-25.md'
Converted 'data\edgar_documents\LMT\4_2024-08-05' --> 'data\processed_data\LMT\4_2024-08-05.md'
Converted 'data\edgar_documents\LMT\4_2024-10-02' --> 'data\processed_data\LMT\4_2024-10-02.md'


2025-11-14 17:00:01,057 - INFO - Going to convert document batch...
2025-11-14 17:00:01,059 - INFO - Processing document 4_2024-10-28
2025-11-14 17:00:01,091 - INFO - Finished converting document 4_2024-10-28 in 0.08 sec.
2025-11-14 17:00:01,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:01,141 - INFO - Going to convert document batch...
2025-11-14 17:00:01,142 - INFO - Processing document 4_2024-11-01
2025-11-14 17:00:01,167 - INFO - Finished converting document 4_2024-11-01 in 0.06 sec.
2025-11-14 17:00:01,211 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:00:01,211 - ERROR - Input document 4_2024-12-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\LMT\4_2024-10-28' --> 'data\processed_data\LMT\4_2024-10-28.md'
Converted 'data\edgar_documents\LMT\4_2024-11-01' --> 'data\processed_data\LMT\4_2024-11-01.md'
Error processing data\edgar_documents\LMT\4_2024-12-04: File format not allowed: data\edgar_documents\LMT\4_2024-12-04
Error processing data\edgar_documents\LMT\4_2024-12-05: File format not allowed: data\edgar_documents\LMT\4_2024-12-05


2025-11-14 17:00:01,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:01,456 - INFO - Going to convert document batch...
2025-11-14 17:00:01,457 - INFO - Processing document 4_2025-01-03
2025-11-14 17:00:01,507 - INFO - Finished converting document 4_2025-01-03 in 0.11 sec.
2025-11-14 17:00:01,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2024-12-10' --> 'data\processed_data\LMT\4_2024-12-10.md'
Converted 'data\edgar_documents\LMT\4_2025-01-03' --> 'data\processed_data\LMT\4_2025-01-03.md'


2025-11-14 17:00:01,612 - INFO - Going to convert document batch...
2025-11-14 17:00:01,612 - INFO - Processing document 4_2025-02-19
2025-11-14 17:00:01,638 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 17:00:01,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:01,693 - INFO - Going to convert document batch...
2025-11-14 17:00:01,694 - INFO - Processing document 4_2025-02-25
2025-11-14 17:00:01,761 - INFO - Finished converting document 4_2025-02-25 in 0.09 sec.
2025-11-14 17:00:01,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2025-02-19' --> 'data\processed_data\LMT\4_2025-02-19.md'
Converted 'data\edgar_documents\LMT\4_2025-02-25' --> 'data\processed_data\LMT\4_2025-02-25.md'


2025-11-14 17:00:01,888 - INFO - Going to convert document batch...
2025-11-14 17:00:01,889 - INFO - Processing document 4_2025-02-28
2025-11-14 17:00:01,921 - INFO - Finished converting document 4_2025-02-28 in 0.11 sec.
2025-11-14 17:00:01,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:01,981 - INFO - Going to convert document batch...
2025-11-14 17:00:01,982 - INFO - Processing document 4_2025-04-02
2025-11-14 17:00:02,018 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 17:00:02,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,084 - INFO - Going to convert document batch...
2025-11-14 17:00:02,085 - INFO - Processing document 4_2025-07-02
2025-11-14 17:00:02,108 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.


Converted 'data\edgar_documents\LMT\4_2025-02-28' --> 'data\processed_data\LMT\4_2025-02-28.md'
Converted 'data\edgar_documents\LMT\4_2025-04-02' --> 'data\processed_data\LMT\4_2025-04-02.md'


2025-11-14 17:00:02,157 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:00:02,158 - ERROR - Input document 4_2025-07-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:00:02,159 - INFO - Going to convert document batch...
2025-11-14 17:00:02,179 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:00:02,180 - ERROR - Input document 4_2025-07-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\LMT\4_2025-07-02' --> 'data\processed_data\LMT\4_2025-07-02.md'
Error processing data\edgar_documents\LMT\4_2025-07-23: File format not allowed: data\edgar_documents\LMT\4_2025-07-23
Error processing data\edgar_documents\LMT\4_2025-07-24: File format not allowed: data\edgar_documents\LMT\4_2025-07-24
Converted 'data\edgar_documents\LMT\4_2025-10-02' --> 'data\processed_data\LMT\4_2025-10-02.md'


2025-11-14 17:00:02,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,379 - INFO - Going to convert document batch...
2025-11-14 17:00:02,380 - INFO - Processing document 4_2025-10-27
2025-11-14 17:00:02,439 - INFO - Finished converting document 4_2025-10-27 in 0.17 sec.
2025-11-14 17:00:02,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,506 - INFO - Going to convert document batch...
2025-11-14 17:00:02,507 - INFO - Processing document 4_2025-10-28
2025-11-14 17:00:02,538 - INFO - Finished converting document 4_2025-10-28 in 0.05 sec.
2025-11-14 17:00:02,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,620 - INFO - Going to convert document batch...
2025-11-14 17:00:02,622 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:00:02,651 - INFO - Finished converting document 8-K_2023-01-24 in 0.09 sec.
2025-11-14 17:00:02,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\4_2025-10-27' --> 'data\processed_data\LMT\4_2025-10-27.md'
Converted 'data\edgar_documents\LMT\4_2025-10-28' --> 'data\processed_data\LMT\4_2025-10-28.md'
Converted 'data\edgar_documents\LMT\8-K_2023-01-24' --> 'data\processed_data\LMT\8-K_2023-01-24.md'


2025-11-14 17:00:02,688 - INFO - Going to convert document batch...
2025-11-14 17:00:02,689 - INFO - Processing document 8-K_2023-02-23
2025-11-14 17:00:02,723 - INFO - Finished converting document 8-K_2023-02-23 in 0.06 sec.
2025-11-14 17:00:02,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,766 - INFO - Going to convert document batch...
2025-11-14 17:00:02,767 - INFO - Processing document 8-K_2023-04-18
2025-11-14 17:00:02,791 - INFO - Finished converting document 8-K_2023-04-18 in 0.05 sec.
2025-11-14 17:00:02,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,841 - INFO - Going to convert document batch...
2025-11-14 17:00:02,842 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:00:02,892 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.


Converted 'data\edgar_documents\LMT\8-K_2023-02-23' --> 'data\processed_data\LMT\8-K_2023-02-23.md'
Converted 'data\edgar_documents\LMT\8-K_2023-04-18' --> 'data\processed_data\LMT\8-K_2023-04-18.md'
Converted 'data\edgar_documents\LMT\8-K_2023-04-27' --> 'data\processed_data\LMT\8-K_2023-04-27.md'


2025-11-14 17:00:02,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:02,985 - INFO - Going to convert document batch...
2025-11-14 17:00:02,987 - INFO - Processing document 8-K_2023-05-25
2025-11-14 17:00:03,102 - INFO - Finished converting document 8-K_2023-05-25 in 0.17 sec.
2025-11-14 17:00:03,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,172 - INFO - Going to convert document batch...
2025-11-14 17:00:03,173 - INFO - Processing document 8-K_2023-07-18
2025-11-14 17:00:03,198 - INFO - Finished converting document 8-K_2023-07-18 in 0.08 sec.
2025-11-14 17:00:03,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,239 - INFO - Going to convert document batch...
2025-11-14 17:00:03,240 - INFO - Processing document 8-K_2023-08-24
2025-11-14 17:00:03,259 - INFO - Finished converting document 8-K_2023-08-24 in 0.05 sec.
2025-11-14 17:00:03,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\LMT\8-K_2023-05-25' --> 'data\processed_data\LMT\8-K_2023-05-25.md'
Converted 'data\edgar_documents\LMT\8-K_2023-07-18' --> 'data\processed_data\LMT\8-K_2023-07-18.md'
Converted 'data\edgar_documents\LMT\8-K_2023-08-24' --> 'data\processed_data\LMT\8-K_2023-08-24.md'


2025-11-14 17:00:03,322 - INFO - Finished converting document 8-K_2023-09-06 in 0.06 sec.
2025-11-14 17:00:03,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,377 - INFO - Going to convert document batch...
2025-11-14 17:00:03,378 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:00:03,416 - INFO - Finished converting document 8-K_2023-10-17 in 0.08 sec.
2025-11-14 17:00:03,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,461 - INFO - Going to convert document batch...
2025-11-14 17:00:03,462 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:00:03,486 - INFO - Finished converting document 8-K_2024-01-23 in 0.06 sec.
2025-11-14 17:00:03,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\8-K_2023-09-06' --> 'data\processed_data\LMT\8-K_2023-09-06.md'
Converted 'data\edgar_documents\LMT\8-K_2023-10-17' --> 'data\processed_data\LMT\8-K_2023-10-17.md'
Converted 'data\edgar_documents\LMT\8-K_2024-01-23' --> 'data\processed_data\LMT\8-K_2024-01-23.md'


2025-11-14 17:00:03,523 - INFO - Going to convert document batch...
2025-11-14 17:00:03,524 - INFO - Processing document 8-K_2024-01-29
2025-11-14 17:00:03,567 - INFO - Finished converting document 8-K_2024-01-29 in 0.06 sec.
2025-11-14 17:00:03,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,622 - INFO - Going to convert document batch...
2025-11-14 17:00:03,622 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:00:03,647 - INFO - Finished converting document 8-K_2024-04-23 in 0.05 sec.
2025-11-14 17:00:03,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:03,691 - INFO - Going to convert document batch...
2025-11-14 17:00:03,692 - INFO - Processing document 8-K_2024-05-03
2025-11-14 17:00:03,736 - INFO - Finished converting document 8-K_2024-05-03 in 0.08 sec.
2025-11-14 17:00:03,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\8-K_2024-01-29' --> 'data\processed_data\LMT\8-K_2024-01-29.md'
Converted 'data\edgar_documents\LMT\8-K_2024-04-23' --> 'data\processed_data\LMT\8-K_2024-04-23.md'
Converted 'data\edgar_documents\LMT\8-K_2024-05-03' --> 'data\processed_data\LMT\8-K_2024-05-03.md'


2025-11-14 17:00:04,102 - INFO - Going to convert document batch...
2025-11-14 17:00:04,103 - INFO - Processing document 8-K_2024-05-22
2025-11-14 17:00:04,127 - INFO - Finished converting document 8-K_2024-05-22 in 0.38 sec.
2025-11-14 17:00:04,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,202 - INFO - Going to convert document batch...
2025-11-14 17:00:04,203 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:00:04,224 - INFO - Finished converting document 8-K_2024-05-24 in 0.08 sec.
2025-11-14 17:00:04,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,274 - INFO - Going to convert document batch...
2025-11-14 17:00:04,275 - INFO - Processing document 8-K_2024-07-19
2025-11-14 17:00:04,303 - INFO - Finished converting document 8-K_2024-07-19 in 0.06 sec.
2025-11-14 17:00:04,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\8-K_2024-05-22' --> 'data\processed_data\LMT\8-K_2024-05-22.md'
Converted 'data\edgar_documents\LMT\8-K_2024-05-24' --> 'data\processed_data\LMT\8-K_2024-05-24.md'
Converted 'data\edgar_documents\LMT\8-K_2024-07-19' --> 'data\processed_data\LMT\8-K_2024-07-19.md'


2025-11-14 17:00:04,356 - INFO - Going to convert document batch...
2025-11-14 17:00:04,357 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:00:04,393 - INFO - Finished converting document 8-K_2024-07-23 in 0.08 sec.
2025-11-14 17:00:04,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,445 - INFO - Going to convert document batch...
2025-11-14 17:00:04,446 - INFO - Processing document 8-K_2024-08-27
2025-11-14 17:00:04,476 - INFO - Finished converting document 8-K_2024-08-27 in 0.06 sec.
2025-11-14 17:00:04,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,516 - INFO - Going to convert document batch...
2025-11-14 17:00:04,516 - INFO - Processing document 8-K_2024-10-22
2025-11-14 17:00:04,535 - INFO - Finished converting document 8-K_2024-10-22 in 0.05 sec.
2025-11-14 17:00:04,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,569 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\LMT\8-K_2024-07-23' --> 'data\processed_data\LMT\8-K_2024-07-23.md'
Converted 'data\edgar_documents\LMT\8-K_2024-08-27' --> 'data\processed_data\LMT\8-K_2024-08-27.md'
Converted 'data\edgar_documents\LMT\8-K_2024-10-22' --> 'data\processed_data\LMT\8-K_2024-10-22.md'


2025-11-14 17:00:04,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,626 - INFO - Going to convert document batch...
2025-11-14 17:00:04,627 - INFO - Processing document 8-K_2024-12-11
2025-11-14 17:00:04,666 - INFO - Finished converting document 8-K_2024-12-11 in 0.06 sec.
2025-11-14 17:00:04,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,710 - INFO - Going to convert document batch...
2025-11-14 17:00:04,711 - INFO - Processing document 8-K_2025-01-28
2025-11-14 17:00:04,740 - INFO - Finished converting document 8-K_2025-01-28 in 0.05 sec.
2025-11-14 17:00:04,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,777 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LMT\8-K_2024-11-13' --> 'data\processed_data\LMT\8-K_2024-11-13.md'
Converted 'data\edgar_documents\LMT\8-K_2024-12-11' --> 'data\processed_data\LMT\8-K_2024-12-11.md'
Converted 'data\edgar_documents\LMT\8-K_2025-01-28' --> 'data\processed_data\LMT\8-K_2025-01-28.md'


2025-11-14 17:00:04,777 - INFO - Processing document 8-K_2025-04-17
2025-11-14 17:00:04,807 - INFO - Finished converting document 8-K_2025-04-17 in 0.05 sec.
2025-11-14 17:00:04,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,855 - INFO - Going to convert document batch...
2025-11-14 17:00:04,856 - INFO - Processing document 8-K_2025-04-22
2025-11-14 17:00:04,875 - INFO - Finished converting document 8-K_2025-04-22 in 0.05 sec.
2025-11-14 17:00:04,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:04,924 - INFO - Going to convert document batch...
2025-11-14 17:00:04,925 - INFO - Processing document 8-K_2025-05-09
2025-11-14 17:00:04,961 - INFO - Finished converting document 8-K_2025-05-09 in 0.06 sec.
2025-11-14 17:00:05,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:05,020 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LMT\8-K_2025-04-17' --> 'data\processed_data\LMT\8-K_2025-04-17.md'
Converted 'data\edgar_documents\LMT\8-K_2025-04-22' --> 'data\processed_data\LMT\8-K_2025-04-22.md'
Converted 'data\edgar_documents\LMT\8-K_2025-05-09' --> 'data\processed_data\LMT\8-K_2025-05-09.md'


2025-11-14 17:00:05,020 - INFO - Processing document 8-K_2025-07-22
2025-11-14 17:00:05,048 - INFO - Finished converting document 8-K_2025-07-22 in 0.08 sec.
2025-11-14 17:00:05,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:05,092 - INFO - Going to convert document batch...
2025-11-14 17:00:05,093 - INFO - Processing document 8-K_2025-07-28
2025-11-14 17:00:05,122 - INFO - Finished converting document 8-K_2025-07-28 in 0.06 sec.
2025-11-14 17:00:05,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:05,162 - INFO - Going to convert document batch...
2025-11-14 17:00:05,165 - INFO - Processing document 8-K_2025-08-29
2025-11-14 17:00:05,184 - INFO - Finished converting document 8-K_2025-08-29 in 0.05 sec.
2025-11-14 17:00:05,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:05,220 - INFO - Going to convert document batch...
2025-11-14 17:00:05,221 - INFO - Processing document 8-K_2025-10-21
2025-11-14 17:

Converted 'data\edgar_documents\LMT\8-K_2025-07-22' --> 'data\processed_data\LMT\8-K_2025-07-22.md'
Converted 'data\edgar_documents\LMT\8-K_2025-07-28' --> 'data\processed_data\LMT\8-K_2025-07-28.md'
Converted 'data\edgar_documents\LMT\8-K_2025-08-29' --> 'data\processed_data\LMT\8-K_2025-08-29.md'


2025-11-14 17:00:05,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\8-K_2025-10-21' --> 'data\processed_data\LMT\8-K_2025-10-21.md'


2025-11-14 17:00:05,982 - INFO - Going to convert document batch...
2025-11-14 17:00:05,983 - INFO - Processing document DEF-14A_2023-03-14
2025-11-14 17:00:10,325 - INFO - Finished converting document DEF-14A_2023-03-14 in 5.08 sec.
2025-11-14 17:00:12,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\DEF-14A_2023-03-14' --> 'data\processed_data\LMT\DEF-14A_2023-03-14.md'


2025-11-14 17:00:13,567 - INFO - Going to convert document batch...
2025-11-14 17:00:13,567 - INFO - Processing document DEF-14A_2024-03-15
2025-11-14 17:00:21,098 - INFO - Finished converting document DEF-14A_2024-03-15 in 8.83 sec.
2025-11-14 17:00:23,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\DEF-14A_2024-03-15' --> 'data\processed_data\LMT\DEF-14A_2024-03-15.md'


2025-11-14 17:00:24,606 - INFO - Going to convert document batch...
2025-11-14 17:00:24,607 - INFO - Processing document DEF-14A_2025-03-27
2025-11-14 17:00:32,020 - INFO - Finished converting document DEF-14A_2025-03-27 in 8.66 sec.
2025-11-14 17:00:34,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LMT\DEF-14A_2025-03-27' --> 'data\processed_data\LMT\DEF-14A_2025-03-27.md'
Processed 86 new files. Errors: 8
Found 86 files to process in data\edgar_documents\LOW


2025-11-14 17:00:34,979 - INFO - Going to convert document batch...
2025-11-14 17:00:34,980 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:00:34,981 - INFO - Processing document 10-K_2023-03-27
2025-11-14 17:00:37,274 - INFO - Finished converting document 10-K_2023-03-27 in 3.00 sec.
2025-11-14 17:00:38,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-K_2023-03-27' --> 'data\processed_data\LOW\10-K_2023-03-27.md'


2025-11-14 17:00:39,453 - INFO - Going to convert document batch...
2025-11-14 17:00:39,455 - INFO - Processing document 10-K_2024-03-25
2025-11-14 17:00:41,774 - INFO - Finished converting document 10-K_2024-03-25 in 3.78 sec.
2025-11-14 17:00:42,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-K_2024-03-25' --> 'data\processed_data\LOW\10-K_2024-03-25.md'


2025-11-14 17:00:43,294 - INFO - Going to convert document batch...
2025-11-14 17:00:43,295 - INFO - Processing document 10-K_2025-03-24
2025-11-14 17:00:45,919 - INFO - Finished converting document 10-K_2025-03-24 in 3.44 sec.
2025-11-14 17:00:46,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-K_2025-03-24' --> 'data\processed_data\LOW\10-K_2025-03-24.md'


2025-11-14 17:00:46,959 - INFO - Going to convert document batch...
2025-11-14 17:00:46,959 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 17:00:47,588 - INFO - Finished converting document 10-Q_2023-06-01 in 1.03 sec.
2025-11-14 17:00:48,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2023-06-01' --> 'data\processed_data\LOW\10-Q_2023-06-01.md'


2025-11-14 17:00:48,392 - INFO - Going to convert document batch...
2025-11-14 17:00:48,392 - INFO - Processing document 10-Q_2023-08-30
2025-11-14 17:00:49,052 - INFO - Finished converting document 10-Q_2023-08-30 in 1.11 sec.
2025-11-14 17:00:49,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2023-08-30' --> 'data\processed_data\LOW\10-Q_2023-08-30.md'


2025-11-14 17:00:50,195 - INFO - Going to convert document batch...
2025-11-14 17:00:50,196 - INFO - Processing document 10-Q_2023-11-29
2025-11-14 17:00:50,999 - INFO - Finished converting document 10-Q_2023-11-29 in 1.61 sec.
2025-11-14 17:00:51,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2023-11-29' --> 'data\processed_data\LOW\10-Q_2023-11-29.md'


2025-11-14 17:00:51,653 - INFO - Going to convert document batch...
2025-11-14 17:00:51,654 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 17:00:52,206 - INFO - Finished converting document 10-Q_2024-05-30 in 0.84 sec.
2025-11-14 17:00:52,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2024-05-30' --> 'data\processed_data\LOW\10-Q_2024-05-30.md'


2025-11-14 17:00:53,572 - INFO - Going to convert document batch...
2025-11-14 17:00:53,573 - INFO - Processing document 10-Q_2024-08-29
2025-11-14 17:00:54,205 - INFO - Finished converting document 10-Q_2024-08-29 in 1.67 sec.
2025-11-14 17:00:54,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2024-08-29' --> 'data\processed_data\LOW\10-Q_2024-08-29.md'


2025-11-14 17:00:54,949 - INFO - Going to convert document batch...
2025-11-14 17:00:54,950 - INFO - Processing document 10-Q_2024-11-27
2025-11-14 17:00:55,723 - INFO - Finished converting document 10-Q_2024-11-27 in 1.16 sec.
2025-11-14 17:00:56,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2024-11-27' --> 'data\processed_data\LOW\10-Q_2024-11-27.md'


2025-11-14 17:00:56,682 - INFO - Going to convert document batch...
2025-11-14 17:00:56,683 - INFO - Processing document 10-Q_2025-05-29
2025-11-14 17:00:57,244 - INFO - Finished converting document 10-Q_2025-05-29 in 0.92 sec.
2025-11-14 17:00:57,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2025-05-29' --> 'data\processed_data\LOW\10-Q_2025-05-29.md'


2025-11-14 17:00:57,920 - INFO - Going to convert document batch...
2025-11-14 17:00:57,921 - INFO - Processing document 10-Q_2025-08-28
2025-11-14 17:00:58,831 - INFO - Finished converting document 10-Q_2025-08-28 in 1.25 sec.
2025-11-14 17:00:59,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:59,580 - INFO - Going to convert document batch...
2025-11-14 17:00:59,582 - INFO - Processing document 4_2023-01-03
2025-11-14 17:00:59,612 - INFO - Finished converting document 4_2023-01-03 in 0.06 sec.
2025-11-14 17:00:59,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:59,664 - INFO - Going to convert document batch...
2025-11-14 17:00:59,664 - INFO - Processing document 4_2023-01-31
2025-11-14 17:00:59,687 - INFO - Finished converting document 4_2023-01-31 in 0.05 sec.
2025-11-14 17:00:59,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\10-Q_2025-08-28' --> 'data\processed_data\LOW\10-Q_2025-08-28.md'
Converted 'data\edgar_documents\LOW\4_2023-01-03' --> 'data\processed_data\LOW\4_2023-01-03.md'
Converted 'data\edgar_documents\LOW\4_2023-01-31' --> 'data\processed_data\LOW\4_2023-01-31.md'


2025-11-14 17:00:59,742 - INFO - Going to convert document batch...
2025-11-14 17:00:59,742 - INFO - Processing document 4_2023-03-13
2025-11-14 17:00:59,777 - INFO - Finished converting document 4_2023-03-13 in 0.06 sec.
2025-11-14 17:00:59,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:59,835 - INFO - Going to convert document batch...
2025-11-14 17:00:59,835 - INFO - Processing document 4_2023-03-16
2025-11-14 17:00:59,860 - INFO - Finished converting document 4_2023-03-16 in 0.05 sec.
2025-11-14 17:00:59,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:00:59,906 - INFO - Going to convert document batch...
2025-11-14 17:00:59,907 - INFO - Processing document 4_2023-03-27
2025-11-14 17:00:59,936 - INFO - Finished converting document 4_2023-03-27 in 0.05 sec.
2025-11-14 17:00:59,995 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\LOW\4_2023-03-13' --> 'data\processed_data\LOW\4_2023-03-13.md'
Converted 'data\edgar_documents\LOW\4_2023-03-16' --> 'data\processed_data\LOW\4_2023-03-16.md'
Converted 'data\edgar_documents\LOW\4_2023-03-27' --> 'data\processed_data\LOW\4_2023-03-27.md'


2025-11-14 17:00:59,996 - ERROR - Input document 4_2023-03-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:00:59,998 - INFO - Going to convert document batch...
2025-11-14 17:01:00,018 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:00,019 - ERROR - Input document 4_2023-03-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\LOW\4_2023-03-28: File format not allowed: data\edgar_documents\LOW\4_2023-03-28
Error processing data\edgar_documents\LOW\4_2023-03-29: File format not allowed: data\edgar_documents\LOW\4_2023-03-29
Converted 'data\edgar_documents\LOW\4_2023-04-03' --> 'data\processed_data\LOW\4_2023-04-03.md'


2025-11-14 17:01:00,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,245 - INFO - Going to convert document batch...
2025-11-14 17:01:00,246 - INFO - Processing document 4_2023-05-30
2025-11-14 17:01:00,287 - INFO - Finished converting document 4_2023-05-30 in 0.06 sec.
2025-11-14 17:01:00,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,398 - INFO - Going to convert document batch...
2025-11-14 17:01:00,399 - INFO - Processing document 4_2023-06-20


Converted 'data\edgar_documents\LOW\4_2023-04-04' --> 'data\processed_data\LOW\4_2023-04-04.md'
Converted 'data\edgar_documents\LOW\4_2023-05-30' --> 'data\processed_data\LOW\4_2023-05-30.md'


2025-11-14 17:01:00,425 - INFO - Finished converting document 4_2023-06-20 in 0.09 sec.
2025-11-14 17:01:00,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,485 - INFO - Going to convert document batch...
2025-11-14 17:01:00,486 - INFO - Processing document 4_2023-07-05
2025-11-14 17:01:00,515 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.


Converted 'data\edgar_documents\LOW\4_2023-06-20' --> 'data\processed_data\LOW\4_2023-06-20.md'
Converted 'data\edgar_documents\LOW\4_2023-07-05' --> 'data\processed_data\LOW\4_2023-07-05.md'


2025-11-14 17:01:00,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,671 - INFO - Going to convert document batch...
2025-11-14 17:01:00,672 - INFO - Processing document 4_2023-08-29
2025-11-14 17:01:00,702 - INFO - Finished converting document 4_2023-08-29 in 0.09 sec.
2025-11-14 17:01:00,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,752 - INFO - Going to convert document batch...
2025-11-14 17:01:00,753 - INFO - Processing document 4_2023-09-05
2025-11-14 17:01:00,775 - INFO - Finished converting document 4_2023-09-05 in 0.05 sec.
2025-11-14 17:01:00,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:00,821 - INFO - Going to convert document batch...
2025-11-14 17:01:00,822 - INFO - Processing document 4_2023-09-19
2025-11-14 17:01:00,850 - INFO - Finished converting document 4_2023-09-19 in 0.05 sec.
2025-11-14 17:01:00,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\4_2023-08-29' --> 'data\processed_data\LOW\4_2023-08-29.md'
Converted 'data\edgar_documents\LOW\4_2023-09-05' --> 'data\processed_data\LOW\4_2023-09-05.md'
Converted 'data\edgar_documents\LOW\4_2023-09-19' --> 'data\processed_data\LOW\4_2023-09-19.md'


2025-11-14 17:01:00,915 - INFO - Going to convert document batch...
2025-11-14 17:01:00,916 - INFO - Processing document 4_2023-10-03
2025-11-14 17:01:00,948 - INFO - Finished converting document 4_2023-10-03 in 0.08 sec.
2025-11-14 17:01:01,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,015 - INFO - Going to convert document batch...
2025-11-14 17:01:01,015 - INFO - Processing document 4_2024-01-03
2025-11-14 17:01:01,036 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 17:01:01,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,088 - INFO - Going to convert document batch...
2025-11-14 17:01:01,089 - INFO - Processing document 4_2024-03-05
2025-11-14 17:01:01,113 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:01:01,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,164 - INFO - Going to convert document batch...
2025-11-14 17:01:01,165 - 

Converted 'data\edgar_documents\LOW\4_2023-10-03' --> 'data\processed_data\LOW\4_2023-10-03.md'
Converted 'data\edgar_documents\LOW\4_2024-01-03' --> 'data\processed_data\LOW\4_2024-01-03.md'
Converted 'data\edgar_documents\LOW\4_2024-03-05' --> 'data\processed_data\LOW\4_2024-03-05.md'


2025-11-14 17:01:01,200 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.
2025-11-14 17:01:01,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,259 - INFO - Going to convert document batch...
2025-11-14 17:01:01,260 - INFO - Processing document 4_2024-03-19
2025-11-14 17:01:01,370 - INFO - Finished converting document 4_2024-03-19 in 0.14 sec.


Converted 'data\edgar_documents\LOW\4_2024-03-11' --> 'data\processed_data\LOW\4_2024-03-11.md'
Converted 'data\edgar_documents\LOW\4_2024-03-19' --> 'data\processed_data\LOW\4_2024-03-19.md'


2025-11-14 17:01:01,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,491 - INFO - Going to convert document batch...
2025-11-14 17:01:01,492 - INFO - Processing document 4_2024-03-25
2025-11-14 17:01:01,529 - INFO - Finished converting document 4_2024-03-25 in 0.12 sec.
2025-11-14 17:01:01,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,590 - INFO - Going to convert document batch...
2025-11-14 17:01:01,591 - INFO - Processing document 4_2024-04-02
2025-11-14 17:01:01,618 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 17:01:01,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,667 - INFO - Going to convert document batch...
2025-11-14 17:01:01,668 - INFO - Processing document 4_2024-04-03
2025-11-14 17:01:01,692 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 17:01:01,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\LOW\4_2024-03-25' --> 'data\processed_data\LOW\4_2024-03-25.md'
Converted 'data\edgar_documents\LOW\4_2024-04-02' --> 'data\processed_data\LOW\4_2024-04-02.md'
Converted 'data\edgar_documents\LOW\4_2024-04-03' --> 'data\processed_data\LOW\4_2024-04-03.md'


2025-11-14 17:01:01,753 - INFO - Processing document 4_2024-06-04
2025-11-14 17:01:01,780 - INFO - Finished converting document 4_2024-06-04 in 0.06 sec.
2025-11-14 17:01:01,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,834 - INFO - Going to convert document batch...
2025-11-14 17:01:01,834 - INFO - Processing document 4_2024-06-18
2025-11-14 17:01:01,854 - INFO - Finished converting document 4_2024-06-18 in 0.05 sec.
2025-11-14 17:01:01,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,902 - INFO - Going to convert document batch...
2025-11-14 17:01:01,902 - INFO - Processing document 4_2024-07-02
2025-11-14 17:01:01,925 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 17:01:01,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:01,980 - INFO - Going to convert document batch...
2025-11-14 17:01:01,981 - INFO - Processing document 4_2024-09-16


Converted 'data\edgar_documents\LOW\4_2024-06-04' --> 'data\processed_data\LOW\4_2024-06-04.md'
Converted 'data\edgar_documents\LOW\4_2024-06-18' --> 'data\processed_data\LOW\4_2024-06-18.md'
Converted 'data\edgar_documents\LOW\4_2024-07-02' --> 'data\processed_data\LOW\4_2024-07-02.md'


2025-11-14 17:01:02,007 - INFO - Finished converting document 4_2024-09-16 in 0.05 sec.
2025-11-14 17:01:02,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,150 - INFO - Going to convert document batch...
2025-11-14 17:01:02,151 - INFO - Processing document 4_2024-09-17
2025-11-14 17:01:02,179 - INFO - Finished converting document 4_2024-09-17 in 0.14 sec.


Converted 'data\edgar_documents\LOW\4_2024-09-16' --> 'data\processed_data\LOW\4_2024-09-16.md'
Converted 'data\edgar_documents\LOW\4_2024-09-17' --> 'data\processed_data\LOW\4_2024-09-17.md'


2025-11-14 17:01:02,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,258 - INFO - Going to convert document batch...
2025-11-14 17:01:02,259 - INFO - Processing document 4_2024-10-02
2025-11-14 17:01:02,289 - INFO - Finished converting document 4_2024-10-02 in 0.08 sec.
2025-11-14 17:01:02,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,423 - INFO - Going to convert document batch...
2025-11-14 17:01:02,424 - INFO - Processing document 4_2024-10-03
2025-11-14 17:01:02,450 - INFO - Finished converting document 4_2024-10-03 in 0.09 sec.
2025-11-14 17:01:02,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,497 - INFO - Going to convert document batch...
2025-11-14 17:01:02,498 - INFO - Processing document 4_2024-10-04
2025-11-14 17:01:02,519 - INFO - Finished converting document 4_2024-10-04 in 0.05 sec.


Converted 'data\edgar_documents\LOW\4_2024-10-02' --> 'data\processed_data\LOW\4_2024-10-02.md'
Converted 'data\edgar_documents\LOW\4_2024-10-03' --> 'data\processed_data\LOW\4_2024-10-03.md'
Converted 'data\edgar_documents\LOW\4_2024-10-04' --> 'data\processed_data\LOW\4_2024-10-04.md'


2025-11-14 17:01:02,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,570 - INFO - Going to convert document batch...
2025-11-14 17:01:02,571 - INFO - Processing document 4_2024-11-29
2025-11-14 17:01:02,600 - INFO - Finished converting document 4_2024-11-29 in 0.05 sec.
2025-11-14 17:01:02,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,649 - INFO - Going to convert document batch...
2025-11-14 17:01:02,650 - INFO - Processing document 4_2024-12-23
2025-11-14 17:01:02,670 - INFO - Finished converting document 4_2024-12-23 in 0.05 sec.
2025-11-14 17:01:02,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,715 - INFO - Going to convert document batch...
2025-11-14 17:01:02,716 - INFO - Processing document 4_2025-01-02
2025-11-14 17:01:02,737 - INFO - Finished converting document 4_2025-01-02 in 0.05 sec.
2025-11-14 17:01:02,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\LOW\4_2024-11-29' --> 'data\processed_data\LOW\4_2024-11-29.md'
Converted 'data\edgar_documents\LOW\4_2024-12-23' --> 'data\processed_data\LOW\4_2024-12-23.md'
Converted 'data\edgar_documents\LOW\4_2025-01-02' --> 'data\processed_data\LOW\4_2025-01-02.md'
Converted 'data\edgar_documents\LOW\4_2025-03-24' --> 'data\processed_data\LOW\4_2025-03-24.md'


2025-11-14 17:01:02,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,852 - INFO - Going to convert document batch...
2025-11-14 17:01:02,853 - INFO - Processing document 4_2025-04-02
2025-11-14 17:01:02,881 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 17:01:02,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:02,931 - INFO - Going to convert document batch...
2025-11-14 17:01:02,932 - INFO - Processing document 4_2025-04-03
2025-11-14 17:01:02,959 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:01:02,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,006 - INFO - Going to convert document batch...
2025-11-14 17:01:03,007 - INFO - Processing document 4_2025-06-03
2025-11-14 17:01:03,036 - INFO - Finished converting document 4_2025-06-03 in 0.05 sec.
2025-11-14 17:01:03,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\LOW\4_2025-04-02' --> 'data\processed_data\LOW\4_2025-04-02.md'
Converted 'data\edgar_documents\LOW\4_2025-04-03' --> 'data\processed_data\LOW\4_2025-04-03.md'
Converted 'data\edgar_documents\LOW\4_2025-06-03' --> 'data\processed_data\LOW\4_2025-06-03.md'


2025-11-14 17:01:03,106 - INFO - Finished converting document 4_2025-06-05 in 0.05 sec.
2025-11-14 17:01:03,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,158 - INFO - Going to convert document batch...
2025-11-14 17:01:03,159 - INFO - Processing document 4_2025-06-12
2025-11-14 17:01:03,189 - INFO - Finished converting document 4_2025-06-12 in 0.06 sec.
2025-11-14 17:01:03,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,248 - INFO - Going to convert document batch...
2025-11-14 17:01:03,250 - INFO - Processing document 4_2025-06-17
2025-11-14 17:01:03,269 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 17:01:03,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,314 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LOW\4_2025-06-05' --> 'data\processed_data\LOW\4_2025-06-05.md'
Converted 'data\edgar_documents\LOW\4_2025-06-12' --> 'data\processed_data\LOW\4_2025-06-12.md'
Converted 'data\edgar_documents\LOW\4_2025-06-17' --> 'data\processed_data\LOW\4_2025-06-17.md'


2025-11-14 17:01:03,314 - INFO - Processing document 4_2025-07-02
2025-11-14 17:01:03,341 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:01:03,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,399 - INFO - Going to convert document batch...
2025-11-14 17:01:03,400 - INFO - Processing document 4_2025-08-21
2025-11-14 17:01:03,425 - INFO - Finished converting document 4_2025-08-21 in 0.05 sec.
2025-11-14 17:01:03,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,487 - INFO - Going to convert document batch...
2025-11-14 17:01:03,488 - INFO - Processing document 4_2025-08-27
2025-11-14 17:01:03,512 - INFO - Finished converting document 4_2025-08-27 in 0.06 sec.
2025-11-14 17:01:03,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,572 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LOW\4_2025-07-02' --> 'data\processed_data\LOW\4_2025-07-02.md'
Converted 'data\edgar_documents\LOW\4_2025-08-21' --> 'data\processed_data\LOW\4_2025-08-21.md'
Converted 'data\edgar_documents\LOW\4_2025-08-27' --> 'data\processed_data\LOW\4_2025-08-27.md'


2025-11-14 17:01:03,572 - INFO - Processing document 4_2025-09-08
2025-11-14 17:01:03,600 - INFO - Finished converting document 4_2025-09-08 in 0.06 sec.
2025-11-14 17:01:03,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,656 - INFO - Going to convert document batch...
2025-11-14 17:01:03,657 - INFO - Processing document 4_2025-09-12
2025-11-14 17:01:03,771 - INFO - Finished converting document 4_2025-09-12 in 0.14 sec.


Converted 'data\edgar_documents\LOW\4_2025-09-08' --> 'data\processed_data\LOW\4_2025-09-08.md'


2025-11-14 17:01:03,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:03,839 - INFO - Going to convert document batch...
2025-11-14 17:01:03,840 - INFO - Processing document 4_2025-09-16
2025-11-14 17:01:03,878 - INFO - Finished converting document 4_2025-09-16 in 0.06 sec.
2025-11-14 17:01:03,972 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:03,973 - ERROR - Input document 4_2025-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:01

Converted 'data\edgar_documents\LOW\4_2025-09-12' --> 'data\processed_data\LOW\4_2025-09-12.md'
Converted 'data\edgar_documents\LOW\4_2025-09-16' --> 'data\processed_data\LOW\4_2025-09-16.md'
Error processing data\edgar_documents\LOW\4_2025-09-23: File format not allowed: data\edgar_documents\LOW\4_2025-09-23


2025-11-14 17:01:03,998 - ERROR - Input document 4_2025-09-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:01:03,999 - INFO - Going to convert document batch...
2025-11-14 17:01:04,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,029 - INFO - Going to convert document batch...
2025-11-14 17:01:04,030 - INFO - Processing document 4_2025-10-02
2025-11-14 17:01:04,056 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.


Error processing data\edgar_documents\LOW\4_2025-09-25: File format not allowed: data\edgar_documents\LOW\4_2025-09-25
Converted 'data\edgar_documents\LOW\4_2025-10-02' --> 'data\processed_data\LOW\4_2025-10-02.md'


2025-11-14 17:01:04,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,280 - INFO - Going to convert document batch...
2025-11-14 17:01:04,282 - INFO - Processing document 8-K_2023-01-23
2025-11-14 17:01:04,313 - INFO - Finished converting document 8-K_2023-01-23 in 0.16 sec.
2025-11-14 17:01:04,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,401 - INFO - Going to convert document batch...
2025-11-14 17:01:04,402 - INFO - Processing document 8-K_2023-03-01
2025-11-14 17:01:04,425 - INFO - Finished converting document 8-K_2023-03-01 in 0.09 sec.
2025-11-14 17:01:04,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,468 - INFO - Going to convert document batch...
2025-11-14 17:01:04,469 - INFO - Processing document 8-K_2023-03-30
2025-11-14 17:01:04,502 - INFO - Finished converting document 8-K_2023-03-30 in 0.06 sec.
2025-11-14 17:01:04,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\8-K_2023-01-23' --> 'data\processed_data\LOW\8-K_2023-01-23.md'
Converted 'data\edgar_documents\LOW\8-K_2023-03-01' --> 'data\processed_data\LOW\8-K_2023-03-01.md'
Converted 'data\edgar_documents\LOW\8-K_2023-03-30' --> 'data\processed_data\LOW\8-K_2023-03-30.md'


2025-11-14 17:01:04,551 - INFO - Going to convert document batch...
2025-11-14 17:01:04,552 - INFO - Processing document 8-K_2023-05-23
2025-11-14 17:01:04,582 - INFO - Finished converting document 8-K_2023-05-23 in 0.06 sec.
2025-11-14 17:01:04,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,632 - INFO - Going to convert document batch...
2025-11-14 17:01:04,633 - INFO - Processing document 8-K_2023-06-01
2025-11-14 17:01:04,665 - INFO - Finished converting document 8-K_2023-06-01 in 0.06 sec.
2025-11-14 17:01:04,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,707 - INFO - Going to convert document batch...
2025-11-14 17:01:04,708 - INFO - Processing document 8-K_2023-08-22
2025-11-14 17:01:04,727 - INFO - Finished converting document 8-K_2023-08-22 in 0.03 sec.
2025-11-14 17:01:04,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,767 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\LOW\8-K_2023-05-23' --> 'data\processed_data\LOW\8-K_2023-05-23.md'
Converted 'data\edgar_documents\LOW\8-K_2023-06-01' --> 'data\processed_data\LOW\8-K_2023-06-01.md'
Converted 'data\edgar_documents\LOW\8-K_2023-08-22' --> 'data\processed_data\LOW\8-K_2023-08-22.md'


2025-11-14 17:01:04,788 - INFO - Finished converting document 8-K_2023-09-07 in 0.05 sec.
2025-11-14 17:01:04,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:04,834 - INFO - Going to convert document batch...
2025-11-14 17:01:04,837 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:01:04,903 - INFO - Finished converting document 8-K_2023-10-25 in 0.11 sec.
2025-11-14 17:01:04,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\8-K_2023-09-07' --> 'data\processed_data\LOW\8-K_2023-09-07.md'
Converted 'data\edgar_documents\LOW\8-K_2023-10-25' --> 'data\processed_data\LOW\8-K_2023-10-25.md'


2025-11-14 17:01:05,013 - INFO - Going to convert document batch...
2025-11-14 17:01:05,014 - INFO - Processing document 8-K_2023-11-21
2025-11-14 17:01:05,043 - INFO - Finished converting document 8-K_2023-11-21 in 0.08 sec.
2025-11-14 17:01:05,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,088 - INFO - Going to convert document batch...
2025-11-14 17:01:05,089 - INFO - Processing document 8-K_2024-02-27
2025-11-14 17:01:05,119 - INFO - Finished converting document 8-K_2024-02-27 in 0.06 sec.
2025-11-14 17:01:05,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,163 - INFO - Going to convert document batch...
2025-11-14 17:01:05,164 - INFO - Processing document 8-K_2024-05-21
2025-11-14 17:01:05,192 - INFO - Finished converting document 8-K_2024-05-21 in 0.06 sec.
2025-11-14 17:01:05,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,266 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\LOW\8-K_2023-11-21' --> 'data\processed_data\LOW\8-K_2023-11-21.md'
Converted 'data\edgar_documents\LOW\8-K_2024-02-27' --> 'data\processed_data\LOW\8-K_2024-02-27.md'
Converted 'data\edgar_documents\LOW\8-K_2024-05-21' --> 'data\processed_data\LOW\8-K_2024-05-21.md'


2025-11-14 17:01:05,268 - INFO - Processing document 8-K_2024-06-05
2025-11-14 17:01:05,331 - INFO - Finished converting document 8-K_2024-06-05 in 0.12 sec.
2025-11-14 17:01:05,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,401 - INFO - Going to convert document batch...
2025-11-14 17:01:05,402 - INFO - Processing document 8-K_2024-08-20
2025-11-14 17:01:05,423 - INFO - Finished converting document 8-K_2024-08-20 in 0.06 sec.
2025-11-14 17:01:05,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,467 - INFO - Going to convert document batch...
2025-11-14 17:01:05,468 - INFO - Processing document 8-K_2024-11-19
2025-11-14 17:01:05,495 - INFO - Finished converting document 8-K_2024-11-19 in 0.06 sec.
2025-11-14 17:01:05,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,535 - INFO - Going to convert document batch...
2025-11-14 17:01:05,536 - INFO - Processing document 8-K_2024-12-11
2025-11-14 17:

Converted 'data\edgar_documents\LOW\8-K_2024-06-05' --> 'data\processed_data\LOW\8-K_2024-06-05.md'
Converted 'data\edgar_documents\LOW\8-K_2024-08-20' --> 'data\processed_data\LOW\8-K_2024-08-20.md'
Converted 'data\edgar_documents\LOW\8-K_2024-11-19' --> 'data\processed_data\LOW\8-K_2024-11-19.md'


2025-11-14 17:01:05,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,601 - INFO - Going to convert document batch...
2025-11-14 17:01:05,602 - INFO - Processing document 8-K_2025-02-26
2025-11-14 17:01:05,637 - INFO - Finished converting document 8-K_2025-02-26 in 0.06 sec.


Converted 'data\edgar_documents\LOW\8-K_2024-12-11' --> 'data\processed_data\LOW\8-K_2024-12-11.md'
Converted 'data\edgar_documents\LOW\8-K_2025-02-26' --> 'data\processed_data\LOW\8-K_2025-02-26.md'


2025-11-14 17:01:05,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,787 - INFO - Going to convert document batch...
2025-11-14 17:01:05,787 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:01:05,815 - INFO - Finished converting document 8-K_2025-05-21 in 0.08 sec.
2025-11-14 17:01:05,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,859 - INFO - Going to convert document batch...
2025-11-14 17:01:05,861 - INFO - Processing document 8-K_2025-06-05
2025-11-14 17:01:05,888 - INFO - Finished converting document 8-K_2025-06-05 in 0.06 sec.
2025-11-14 17:01:05,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:05,934 - INFO - Going to convert document batch...
2025-11-14 17:01:05,935 - INFO - Processing document 8-K_2025-08-20
2025-11-14 17:01:05,966 - INFO - Finished converting document 8-K_2025-08-20 in 0.06 sec.
2025-11-14 17:01:06,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\8-K_2025-05-21' --> 'data\processed_data\LOW\8-K_2025-05-21.md'
Converted 'data\edgar_documents\LOW\8-K_2025-06-05' --> 'data\processed_data\LOW\8-K_2025-06-05.md'
Converted 'data\edgar_documents\LOW\8-K_2025-08-20' --> 'data\processed_data\LOW\8-K_2025-08-20.md'


2025-11-14 17:01:06,021 - INFO - Going to convert document batch...
2025-11-14 17:01:06,022 - INFO - Processing document 8-K_2025-09-19
2025-11-14 17:01:06,071 - INFO - Finished converting document 8-K_2025-09-19 in 0.08 sec.
2025-11-14 17:01:06,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\LOW\8-K_2025-09-19' --> 'data\processed_data\LOW\8-K_2025-09-19.md'


2025-11-14 17:01:06,414 - INFO - Going to convert document batch...
2025-11-14 17:01:06,414 - INFO - Processing document 8-K_2025-09-30
2025-11-14 17:01:06,452 - INFO - Finished converting document 8-K_2025-09-30 in 0.36 sec.
2025-11-14 17:01:06,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:06,577 - INFO - Going to convert document batch...
2025-11-14 17:01:06,578 - INFO - Processing document 8-K_2025-10-09
2025-11-14 17:01:06,629 - INFO - Finished converting document 8-K_2025-10-09 in 0.14 sec.


Converted 'data\edgar_documents\LOW\8-K_2025-09-30' --> 'data\processed_data\LOW\8-K_2025-09-30.md'
Converted 'data\edgar_documents\LOW\8-K_2025-10-09' --> 'data\processed_data\LOW\8-K_2025-10-09.md'


2025-11-14 17:01:06,712 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:06,713 - ERROR - Input document DEF-14A_2023-04-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:01:06,715 - INFO - Going to convert document batch...
2025-11-14 17:01:06,764 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:06,765 - ERROR - Input document DEF-14A_2024-04-18 with format No

Error processing data\edgar_documents\LOW\DEF-14A_2023-04-13: File format not allowed: data\edgar_documents\LOW\DEF-14A_2023-04-13
Error processing data\edgar_documents\LOW\DEF-14A_2024-04-18: File format not allowed: data\edgar_documents\LOW\DEF-14A_2024-04-18
Error processing data\edgar_documents\LOW\DEF-14A_2025-04-17: File format not allowed: data\edgar_documents\LOW\DEF-14A_2025-04-17
Processed 79 new files. Errors: 7
Found 184 files to process in data\edgar_documents\MA


2025-11-14 17:01:06,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:08,076 - INFO - Going to convert document batch...
2025-11-14 17:01:08,077 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:01:08,078 - INFO - Processing document 10-K_2023-02-14
2025-11-14 17:01:10,911 - INFO - Finished converting document 10-K_2023-02-14 in 4.09 sec.
2025-11-14 17:01:12,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-K_2023-02-14' --> 'data\processed_data\MA\10-K_2023-02-14.md'


2025-11-14 17:01:13,710 - INFO - Going to convert document batch...
2025-11-14 17:01:13,711 - INFO - Processing document 10-K_2024-02-13
2025-11-14 17:01:17,587 - INFO - Finished converting document 10-K_2024-02-13 in 5.30 sec.
2025-11-14 17:01:19,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-K_2024-02-13' --> 'data\processed_data\MA\10-K_2024-02-13.md'


2025-11-14 17:01:21,385 - INFO - Going to convert document batch...
2025-11-14 17:01:21,387 - INFO - Processing document 10-K_2025-02-12
2025-11-14 17:01:24,269 - INFO - Finished converting document 10-K_2025-02-12 in 4.97 sec.
2025-11-14 17:01:25,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-K_2025-02-12' --> 'data\processed_data\MA\10-K_2025-02-12.md'


2025-11-14 17:01:26,326 - INFO - Going to convert document batch...
2025-11-14 17:01:26,327 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:01:28,319 - INFO - Finished converting document 10-Q_2023-04-27 in 2.67 sec.
2025-11-14 17:01:28,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2023-04-27' --> 'data\processed_data\MA\10-Q_2023-04-27.md'


2025-11-14 17:01:29,596 - INFO - Going to convert document batch...
2025-11-14 17:01:29,597 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:01:31,117 - INFO - Finished converting document 10-Q_2023-07-27 in 2.23 sec.
2025-11-14 17:01:31,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2023-07-27' --> 'data\processed_data\MA\10-Q_2023-07-27.md'


2025-11-14 17:01:33,053 - INFO - Going to convert document batch...
2025-11-14 17:01:33,054 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:01:34,359 - INFO - Finished converting document 10-Q_2023-10-26 in 2.53 sec.
2025-11-14 17:01:35,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2023-10-26' --> 'data\processed_data\MA\10-Q_2023-10-26.md'


2025-11-14 17:01:36,249 - INFO - Going to convert document batch...
2025-11-14 17:01:36,250 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 17:01:37,181 - INFO - Finished converting document 10-Q_2024-05-01 in 1.97 sec.
2025-11-14 17:01:37,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2024-05-01' --> 'data\processed_data\MA\10-Q_2024-05-01.md'


2025-11-14 17:01:38,380 - INFO - Going to convert document batch...
2025-11-14 17:01:38,381 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 17:01:39,569 - INFO - Finished converting document 10-Q_2024-07-31 in 1.80 sec.
2025-11-14 17:01:40,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2024-07-31' --> 'data\processed_data\MA\10-Q_2024-07-31.md'


2025-11-14 17:01:41,353 - INFO - Going to convert document batch...
2025-11-14 17:01:41,354 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 17:01:42,404 - INFO - Finished converting document 10-Q_2024-10-31 in 2.05 sec.
2025-11-14 17:01:43,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2024-10-31' --> 'data\processed_data\MA\10-Q_2024-10-31.md'


2025-11-14 17:01:44,224 - INFO - Going to convert document batch...
2025-11-14 17:01:44,225 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 17:01:45,233 - INFO - Finished converting document 10-Q_2025-05-01 in 1.98 sec.
2025-11-14 17:01:45,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2025-05-01' --> 'data\processed_data\MA\10-Q_2025-05-01.md'


2025-11-14 17:01:46,516 - INFO - Going to convert document batch...
2025-11-14 17:01:46,517 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 17:01:48,281 - INFO - Finished converting document 10-Q_2025-07-31 in 2.39 sec.
2025-11-14 17:01:49,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\10-Q_2025-07-31' --> 'data\processed_data\MA\10-Q_2025-07-31.md'


2025-11-14 17:01:49,589 - INFO - Going to convert document batch...
2025-11-14 17:01:49,590 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 17:01:50,756 - INFO - Finished converting document 10-Q_2025-10-30 in 1.81 sec.
2025-11-14 17:01:51,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:51,711 - INFO - Going to convert document batch...
2025-11-14 17:01:51,712 - INFO - Processing document 4_2023-01-10
2025-11-14 17:01:51,742 - INFO - Finished converting document 4_2023-01-10 in 0.05 sec.
2025-11-14 17:01:51,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:51,820 - INFO - Going to convert document batch...
2025-11-14 17:01:51,821 - INFO - Processing document 4_2023-01-12
2025-11-14 17:01:51,845 - INFO - Finished converting document 4_2023-01-12 in 0.06 sec.


Converted 'data\edgar_documents\MA\10-Q_2025-10-30' --> 'data\processed_data\MA\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\MA\4_2023-01-10' --> 'data\processed_data\MA\4_2023-01-10.md'
Converted 'data\edgar_documents\MA\4_2023-01-12' --> 'data\processed_data\MA\4_2023-01-12.md'


2025-11-14 17:01:51,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:51,920 - INFO - Going to convert document batch...
2025-11-14 17:01:51,921 - INFO - Processing document 4_2023-01-30
2025-11-14 17:01:51,968 - INFO - Finished converting document 4_2023-01-30 in 0.09 sec.
2025-11-14 17:01:52,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,063 - INFO - Going to convert document batch...
2025-11-14 17:01:52,065 - INFO - Processing document 4_2023-02-08
2025-11-14 17:01:52,089 - INFO - Finished converting document 4_2023-02-08 in 0.09 sec.
2025-11-14 17:01:52,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,147 - INFO - Going to convert document batch...
2025-11-14 17:01:52,147 - INFO - Processing document 4_2023-02-10
2025-11-14 17:01:52,170 - INFO - Finished converting document 4_2023-02-10 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2023-01-30' --> 'data\processed_data\MA\4_2023-01-30.md'
Converted 'data\edgar_documents\MA\4_2023-02-08' --> 'data\processed_data\MA\4_2023-02-08.md'


2025-11-14 17:01:52,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,231 - INFO - Going to convert document batch...
2025-11-14 17:01:52,232 - INFO - Processing document 4_2023-02-14
2025-11-14 17:01:52,348 - INFO - Finished converting document 4_2023-02-14 in 0.16 sec.


Converted 'data\edgar_documents\MA\4_2023-02-10' --> 'data\processed_data\MA\4_2023-02-10.md'


2025-11-14 17:01:52,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,439 - INFO - Going to convert document batch...
2025-11-14 17:01:52,440 - INFO - Processing document 4_2023-02-28
2025-11-14 17:01:52,475 - INFO - Finished converting document 4_2023-02-28 in 0.09 sec.
2025-11-14 17:01:52,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,537 - INFO - Going to convert document batch...
2025-11-14 17:01:52,538 - INFO - Processing document 4_2023-03-03
2025-11-14 17:01:52,565 - INFO - Finished converting document 4_2023-03-03 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2023-02-14' --> 'data\processed_data\MA\4_2023-02-14.md'
Converted 'data\edgar_documents\MA\4_2023-02-28' --> 'data\processed_data\MA\4_2023-02-28.md'


2025-11-14 17:01:52,634 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:52,635 - ERROR - Input document 4_2023-03-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:01:52,637 - INFO - Going to convert document batch...
2025-11-14 17:01:52,662 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:01:52,663 - ERROR - Input document 4_2023-03-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MA\4_2023-03-03' --> 'data\processed_data\MA\4_2023-03-03.md'
Error processing data\edgar_documents\MA\4_2023-03-06: File format not allowed: data\edgar_documents\MA\4_2023-03-06
Error processing data\edgar_documents\MA\4_2023-03-08: File format not allowed: data\edgar_documents\MA\4_2023-03-08
Converted 'data\edgar_documents\MA\4_2023-05-04' --> 'data\processed_data\MA\4_2023-05-04.md'


2025-11-14 17:01:52,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,825 - INFO - Going to convert document batch...
2025-11-14 17:01:52,827 - INFO - Processing document 4_2023-05-09
2025-11-14 17:01:52,883 - INFO - Finished converting document 4_2023-05-09 in 0.11 sec.
2025-11-14 17:01:52,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:52,941 - INFO - Going to convert document batch...
2025-11-14 17:01:52,942 - INFO - Processing document 4_2023-05-10
2025-11-14 17:01:52,977 - INFO - Finished converting document 4_2023-05-10 in 0.05 sec.
2025-11-14 17:01:53,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:53,040 - INFO - Going to convert document batch...
2025-11-14 17:01:53,041 - INFO - Processing document 4_2023-05-15
2025-11-14 17:01:53,069 - INFO - Finished converting document 4_2023-05-15 in 0.06 sec.
2025-11-14 17:01:53,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2023-05-09' --> 'data\processed_data\MA\4_2023-05-09.md'
Converted 'data\edgar_documents\MA\4_2023-05-10' --> 'data\processed_data\MA\4_2023-05-10.md'
Converted 'data\edgar_documents\MA\4_2023-05-15' --> 'data\processed_data\MA\4_2023-05-15.md'


2025-11-14 17:01:53,150 - INFO - Going to convert document batch...
2025-11-14 17:01:53,151 - INFO - Processing document 4_2023-05-17
2025-11-14 17:01:53,682 - INFO - Finished converting document 4_2023-05-17 in 0.59 sec.
2025-11-14 17:01:53,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:53,783 - INFO - Going to convert document batch...
2025-11-14 17:01:53,784 - INFO - Processing document 4_2023-05-19
2025-11-14 17:01:53,813 - INFO - Finished converting document 4_2023-05-19 in 0.09 sec.
2025-11-14 17:01:53,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:53,881 - INFO - Going to convert document batch...
2025-11-14 17:01:53,882 - INFO - Processing document 4_2023-06-14
2025-11-14 17:01:53,921 - INFO - Finished converting document 4_2023-06-14 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2023-05-17' --> 'data\processed_data\MA\4_2023-05-17.md'
Converted 'data\edgar_documents\MA\4_2023-05-19' --> 'data\processed_data\MA\4_2023-05-19.md'


2025-11-14 17:01:53,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:53,999 - INFO - Going to convert document batch...
2025-11-14 17:01:53,999 - INFO - Processing document 4_2023-06-26
2025-11-14 17:01:54,022 - INFO - Finished converting document 4_2023-06-26 in 0.06 sec.
2025-11-14 17:01:54,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,082 - INFO - Going to convert document batch...
2025-11-14 17:01:54,083 - INFO - Processing document 4_2023-06-29
2025-11-14 17:01:54,107 - INFO - Finished converting document 4_2023-06-29 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2023-06-14' --> 'data\processed_data\MA\4_2023-06-14.md'
Converted 'data\edgar_documents\MA\4_2023-06-26' --> 'data\processed_data\MA\4_2023-06-26.md'


2025-11-14 17:01:54,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,178 - INFO - Going to convert document batch...
2025-11-14 17:01:54,179 - INFO - Processing document 4_2023-07-05
2025-11-14 17:01:54,214 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 17:01:54,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,285 - INFO - Going to convert document batch...
2025-11-14 17:01:54,285 - INFO - Processing document 4_2023-07-13
2025-11-14 17:01:54,311 - INFO - Finished converting document 4_2023-07-13 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2023-06-29' --> 'data\processed_data\MA\4_2023-06-29.md'
Converted 'data\edgar_documents\MA\4_2023-07-05' --> 'data\processed_data\MA\4_2023-07-05.md'


2025-11-14 17:01:54,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,370 - INFO - Going to convert document batch...
2025-11-14 17:01:54,371 - INFO - Processing document 4_2023-08-03
2025-11-14 17:01:54,419 - INFO - Finished converting document 4_2023-08-03 in 0.08 sec.
2025-11-14 17:01:54,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,531 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MA\4_2023-07-13' --> 'data\processed_data\MA\4_2023-07-13.md'
Converted 'data\edgar_documents\MA\4_2023-08-03' --> 'data\processed_data\MA\4_2023-08-03.md'


2025-11-14 17:01:54,532 - INFO - Processing document 4_2023-08-10
2025-11-14 17:01:54,564 - INFO - Finished converting document 4_2023-08-10 in 0.09 sec.
2025-11-14 17:01:54,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,646 - INFO - Going to convert document batch...
2025-11-14 17:01:54,647 - INFO - Processing document 4_2023-08-15
2025-11-14 17:01:54,684 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 17:01:54,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,748 - INFO - Going to convert document batch...
2025-11-14 17:01:54,748 - INFO - Processing document 4_2023-08-17
2025-11-14 17:01:54,777 - INFO - Finished converting document 4_2023-08-17 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2023-08-10' --> 'data\processed_data\MA\4_2023-08-10.md'
Converted 'data\edgar_documents\MA\4_2023-08-15' --> 'data\processed_data\MA\4_2023-08-15.md'
Converted 'data\edgar_documents\MA\4_2023-08-17' --> 'data\processed_data\MA\4_2023-08-17.md'


2025-11-14 17:01:54,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,847 - INFO - Going to convert document batch...
2025-11-14 17:01:54,848 - INFO - Processing document 4_2023-08-30
2025-11-14 17:01:54,907 - INFO - Finished converting document 4_2023-08-30 in 0.09 sec.
2025-11-14 17:01:54,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:54,988 - INFO - Going to convert document batch...
2025-11-14 17:01:54,990 - INFO - Processing document 4_2023-08-31
2025-11-14 17:01:55,032 - INFO - Finished converting document 4_2023-08-31 in 0.08 sec.
2025-11-14 17:01:55,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:55,126 - INFO - Going to convert document batch...
2025-11-14 17:01:55,127 - INFO - Processing document 4_2023-09-05


Converted 'data\edgar_documents\MA\4_2023-08-30' --> 'data\processed_data\MA\4_2023-08-30.md'
Converted 'data\edgar_documents\MA\4_2023-08-31' --> 'data\processed_data\MA\4_2023-08-31.md'


2025-11-14 17:01:55,158 - INFO - Finished converting document 4_2023-09-05 in 0.08 sec.
2025-11-14 17:01:55,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:55,256 - INFO - Going to convert document batch...
2025-11-14 17:01:55,258 - INFO - Processing document 4_2023-09-18
2025-11-14 17:01:55,342 - INFO - Finished converting document 4_2023-09-18 in 0.16 sec.


Converted 'data\edgar_documents\MA\4_2023-09-05' --> 'data\processed_data\MA\4_2023-09-05.md'
Converted 'data\edgar_documents\MA\4_2023-09-18' --> 'data\processed_data\MA\4_2023-09-18.md'


2025-11-14 17:01:55,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:55,500 - INFO - Going to convert document batch...
2025-11-14 17:01:55,501 - INFO - Processing document 4_2023-09-21
2025-11-14 17:01:55,572 - INFO - Finished converting document 4_2023-09-21 in 0.19 sec.
2025-11-14 17:01:55,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:55,679 - INFO - Going to convert document batch...
2025-11-14 17:01:55,682 - INFO - Processing document 4_2023-10-03
2025-11-14 17:01:55,749 - INFO - Finished converting document 4_2023-10-03 in 0.12 sec.
2025-11-14 17:01:55,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2023-09-21' --> 'data\processed_data\MA\4_2023-09-21.md'
Converted 'data\edgar_documents\MA\4_2023-10-03' --> 'data\processed_data\MA\4_2023-10-03.md'


2025-11-14 17:01:55,826 - INFO - Going to convert document batch...
2025-11-14 17:01:55,827 - INFO - Processing document 4_2023-11-03
2025-11-14 17:01:55,861 - INFO - Finished converting document 4_2023-11-03 in 0.06 sec.
2025-11-14 17:01:55,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:55,920 - INFO - Going to convert document batch...
2025-11-14 17:01:55,921 - INFO - Processing document 4_2023-11-08
2025-11-14 17:01:55,951 - INFO - Finished converting document 4_2023-11-08 in 0.06 sec.
2025-11-14 17:01:56,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,016 - INFO - Going to convert document batch...
2025-11-14 17:01:56,016 - INFO - Processing document 4_2023-11-09
2025-11-14 17:01:56,040 - INFO - Finished converting document 4_2023-11-09 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2023-11-03' --> 'data\processed_data\MA\4_2023-11-03.md'
Converted 'data\edgar_documents\MA\4_2023-11-08' --> 'data\processed_data\MA\4_2023-11-08.md'
Converted 'data\edgar_documents\MA\4_2023-11-09' --> 'data\processed_data\MA\4_2023-11-09.md'


2025-11-14 17:01:56,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,119 - INFO - Going to convert document batch...
2025-11-14 17:01:56,120 - INFO - Processing document 4_2023-11-13
2025-11-14 17:01:56,154 - INFO - Finished converting document 4_2023-11-13 in 0.09 sec.
2025-11-14 17:01:56,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,209 - INFO - Going to convert document batch...
2025-11-14 17:01:56,210 - INFO - Processing document 4_2023-11-27
2025-11-14 17:01:56,230 - INFO - Finished converting document 4_2023-11-27 in 0.05 sec.
2025-11-14 17:01:56,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,283 - INFO - Going to convert document batch...
2025-11-14 17:01:56,284 - INFO - Processing document 4_2023-12-01
2025-11-14 17:01:56,305 - INFO - Finished converting document 4_2023-12-01 in 0.05 sec.
2025-11-14 17:01:56,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MA\4_2023-11-13' --> 'data\processed_data\MA\4_2023-11-13.md'
Converted 'data\edgar_documents\MA\4_2023-11-27' --> 'data\processed_data\MA\4_2023-11-27.md'
Converted 'data\edgar_documents\MA\4_2023-12-01' --> 'data\processed_data\MA\4_2023-12-01.md'


2025-11-14 17:01:56,384 - INFO - Processing document 4_2023-12-15
2025-11-14 17:01:56,429 - INFO - Finished converting document 4_2023-12-15 in 0.09 sec.
2025-11-14 17:01:56,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,594 - INFO - Going to convert document batch...
2025-11-14 17:01:56,595 - INFO - Processing document 4_2024-01-04
2025-11-14 17:01:56,632 - INFO - Finished converting document 4_2024-01-04 in 0.14 sec.


Converted 'data\edgar_documents\MA\4_2023-12-15' --> 'data\processed_data\MA\4_2023-12-15.md'


2025-11-14 17:01:56,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,700 - INFO - Going to convert document batch...
2025-11-14 17:01:56,701 - INFO - Processing document 4_2024-01-16
2025-11-14 17:01:56,759 - INFO - Finished converting document 4_2024-01-16 in 0.08 sec.
2025-11-14 17:01:56,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,830 - INFO - Going to convert document batch...
2025-11-14 17:01:56,831 - INFO - Processing document 4_2024-01-23
2025-11-14 17:01:56,870 - INFO - Finished converting document 4_2024-01-23 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-01-04' --> 'data\processed_data\MA\4_2024-01-04.md'
Converted 'data\edgar_documents\MA\4_2024-01-16' --> 'data\processed_data\MA\4_2024-01-16.md'


2025-11-14 17:01:56,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:56,926 - INFO - Going to convert document batch...
2025-11-14 17:01:56,927 - INFO - Processing document 4_2024-02-02
2025-11-14 17:01:56,964 - INFO - Finished converting document 4_2024-02-02 in 0.06 sec.
2025-11-14 17:01:57,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,028 - INFO - Going to convert document batch...
2025-11-14 17:01:57,028 - INFO - Processing document 4_2024-02-20
2025-11-14 17:01:57,063 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2024-01-23' --> 'data\processed_data\MA\4_2024-01-23.md'
Converted 'data\edgar_documents\MA\4_2024-02-02' --> 'data\processed_data\MA\4_2024-02-02.md'


2025-11-14 17:01:57,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,132 - INFO - Going to convert document batch...
2025-11-14 17:01:57,133 - INFO - Processing document 4_2024-02-29
2025-11-14 17:01:57,183 - INFO - Finished converting document 4_2024-02-29 in 0.09 sec.
2025-11-14 17:01:57,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-02-20' --> 'data\processed_data\MA\4_2024-02-20.md'
Converted 'data\edgar_documents\MA\4_2024-02-29' --> 'data\processed_data\MA\4_2024-02-29.md'


2025-11-14 17:01:57,299 - INFO - Going to convert document batch...
2025-11-14 17:01:57,300 - INFO - Processing document 4_2024-03-05
2025-11-14 17:01:57,386 - INFO - Finished converting document 4_2024-03-05 in 0.17 sec.
2025-11-14 17:01:57,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,480 - INFO - Going to convert document batch...
2025-11-14 17:01:57,480 - INFO - Processing document 4_2024-03-12
2025-11-14 17:01:57,503 - INFO - Finished converting document 4_2024-03-12 in 0.08 sec.
2025-11-14 17:01:57,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,553 - INFO - Going to convert document batch...
2025-11-14 17:01:57,553 - INFO - Processing document 4_2024-03-19
2025-11-14 17:01:57,584 - INFO - Finished converting document 4_2024-03-19 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2024-03-05' --> 'data\processed_data\MA\4_2024-03-05.md'
Converted 'data\edgar_documents\MA\4_2024-03-12' --> 'data\processed_data\MA\4_2024-03-12.md'


2025-11-14 17:01:57,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,640 - INFO - Going to convert document batch...
2025-11-14 17:01:57,641 - INFO - Processing document 4_2024-03-22
2025-11-14 17:01:57,677 - INFO - Finished converting document 4_2024-03-22 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2024-03-19' --> 'data\processed_data\MA\4_2024-03-19.md'
Converted 'data\edgar_documents\MA\4_2024-03-22' --> 'data\processed_data\MA\4_2024-03-22.md'


2025-11-14 17:01:57,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,848 - INFO - Going to convert document batch...
2025-11-14 17:01:57,849 - INFO - Processing document 4_2024-04-11
2025-11-14 17:01:57,879 - INFO - Finished converting document 4_2024-04-11 in 0.08 sec.
2025-11-14 17:01:57,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:57,930 - INFO - Going to convert document batch...
2025-11-14 17:01:57,932 - INFO - Processing document 4_2024-04-16
2025-11-14 17:01:57,953 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 17:01:58,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,021 - INFO - Going to convert document batch...
2025-11-14 17:01:58,022 - INFO - Processing document 4_2024-04-19
2025-11-14 17:01:58,055 - INFO - Finished converting document 4_2024-04-19 in 0.06 sec.
2025-11-14 17:01:58,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-04-11' --> 'data\processed_data\MA\4_2024-04-11.md'
Converted 'data\edgar_documents\MA\4_2024-04-16' --> 'data\processed_data\MA\4_2024-04-16.md'
Converted 'data\edgar_documents\MA\4_2024-04-19' --> 'data\processed_data\MA\4_2024-04-19.md'


2025-11-14 17:01:58,106 - INFO - Going to convert document batch...
2025-11-14 17:01:58,107 - INFO - Processing document 4_2024-04-22
2025-11-14 17:01:58,155 - INFO - Finished converting document 4_2024-04-22 in 0.08 sec.
2025-11-14 17:01:58,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,232 - INFO - Going to convert document batch...
2025-11-14 17:01:58,233 - INFO - Processing document 4_2024-04-23
2025-11-14 17:01:58,269 - INFO - Finished converting document 4_2024-04-23 in 0.08 sec.
2025-11-14 17:01:58,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,332 - INFO - Going to convert document batch...
2025-11-14 17:01:58,333 - INFO - Processing document 4_2024-04-24
2025-11-14 17:01:58,365 - INFO - Finished converting document 4_2024-04-24 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2024-04-22' --> 'data\processed_data\MA\4_2024-04-22.md'
Converted 'data\edgar_documents\MA\4_2024-04-23' --> 'data\processed_data\MA\4_2024-04-23.md'


2025-11-14 17:01:58,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,423 - INFO - Going to convert document batch...
2025-11-14 17:01:58,425 - INFO - Processing document 4_2024-04-25
2025-11-14 17:01:58,472 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 17:01:58,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-04-24' --> 'data\processed_data\MA\4_2024-04-24.md'
Converted 'data\edgar_documents\MA\4_2024-04-25' --> 'data\processed_data\MA\4_2024-04-25.md'


2025-11-14 17:01:58,613 - INFO - Going to convert document batch...
2025-11-14 17:01:58,614 - INFO - Processing document 4_2024-04-26
2025-11-14 17:01:58,650 - INFO - Finished converting document 4_2024-04-26 in 0.08 sec.
2025-11-14 17:01:58,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,709 - INFO - Going to convert document batch...
2025-11-14 17:01:58,710 - INFO - Processing document 4_2024-04-29
2025-11-14 17:01:58,740 - INFO - Finished converting document 4_2024-04-29 in 0.05 sec.
2025-11-14 17:01:58,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:58,795 - INFO - Going to convert document batch...
2025-11-14 17:01:58,796 - INFO - Processing document 4_2024-05-02


Converted 'data\edgar_documents\MA\4_2024-04-26' --> 'data\processed_data\MA\4_2024-04-26.md'
Converted 'data\edgar_documents\MA\4_2024-04-29' --> 'data\processed_data\MA\4_2024-04-29.md'


2025-11-14 17:01:59,103 - INFO - Finished converting document 4_2024-05-02 in 0.33 sec.
2025-11-14 17:01:59,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:59,199 - INFO - Going to convert document batch...
2025-11-14 17:01:59,200 - INFO - Processing document 4_2024-05-03


Converted 'data\edgar_documents\MA\4_2024-05-02' --> 'data\processed_data\MA\4_2024-05-02.md'


2025-11-14 17:01:59,344 - INFO - Finished converting document 4_2024-05-03 in 0.20 sec.
2025-11-14 17:01:59,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:59,434 - INFO - Going to convert document batch...
2025-11-14 17:01:59,434 - INFO - Processing document 4_2024-05-06
2025-11-14 17:01:59,473 - INFO - Finished converting document 4_2024-05-06 in 0.09 sec.
2025-11-14 17:01:59,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:59,531 - INFO - Going to convert document batch...
2025-11-14 17:01:59,532 - INFO - Processing document 4_2024-05-07
2025-11-14 17:01:59,560 - INFO - Finished converting document 4_2024-05-07 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2024-05-03' --> 'data\processed_data\MA\4_2024-05-03.md'
Converted 'data\edgar_documents\MA\4_2024-05-06' --> 'data\processed_data\MA\4_2024-05-06.md'


2025-11-14 17:01:59,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:59,615 - INFO - Going to convert document batch...
2025-11-14 17:01:59,616 - INFO - Processing document 4_2024-05-08
2025-11-14 17:01:59,719 - INFO - Finished converting document 4_2024-05-08 in 0.14 sec.


Converted 'data\edgar_documents\MA\4_2024-05-07' --> 'data\processed_data\MA\4_2024-05-07.md'


2025-11-14 17:01:59,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:01:59,805 - INFO - Going to convert document batch...
2025-11-14 17:01:59,806 - INFO - Processing document 4_2024-05-09
2025-11-14 17:01:59,852 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.
2025-11-14 17:01:59,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-05-08' --> 'data\processed_data\MA\4_2024-05-08.md'
Converted 'data\edgar_documents\MA\4_2024-05-09' --> 'data\processed_data\MA\4_2024-05-09.md'


2025-11-14 17:01:59,974 - INFO - Going to convert document batch...
2025-11-14 17:01:59,975 - INFO - Processing document 4_2024-05-10
2025-11-14 17:02:00,009 - INFO - Finished converting document 4_2024-05-10 in 0.06 sec.
2025-11-14 17:02:00,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,081 - INFO - Going to convert document batch...
2025-11-14 17:02:00,082 - INFO - Processing document 4_2024-05-13
2025-11-14 17:02:00,116 - INFO - Finished converting document 4_2024-05-13 in 0.06 sec.
2025-11-14 17:02:00,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,175 - INFO - Going to convert document batch...
2025-11-14 17:02:00,176 - INFO - Processing document 4_2024-05-14
2025-11-14 17:02:00,209 - INFO - Finished converting document 4_2024-05-14 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2024-05-10' --> 'data\processed_data\MA\4_2024-05-10.md'
Converted 'data\edgar_documents\MA\4_2024-05-13' --> 'data\processed_data\MA\4_2024-05-13.md'


2025-11-14 17:02:00,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,262 - INFO - Going to convert document batch...
2025-11-14 17:02:00,263 - INFO - Processing document 4_2024-05-15
2025-11-14 17:02:00,290 - INFO - Finished converting document 4_2024-05-15 in 0.05 sec.
2025-11-14 17:02:00,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,346 - INFO - Going to convert document batch...
2025-11-14 17:02:00,346 - INFO - Processing document 4_2024-05-16
2025-11-14 17:02:00,378 - INFO - Finished converting document 4_2024-05-16 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2024-05-14' --> 'data\processed_data\MA\4_2024-05-14.md'
Converted 'data\edgar_documents\MA\4_2024-05-15' --> 'data\processed_data\MA\4_2024-05-15.md'
Converted 'data\edgar_documents\MA\4_2024-05-16' --> 'data\processed_data\MA\4_2024-05-16.md'


2025-11-14 17:02:00,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,442 - INFO - Going to convert document batch...
2025-11-14 17:02:00,443 - INFO - Processing document 4_2024-05-17
2025-11-14 17:02:00,562 - INFO - Finished converting document 4_2024-05-17 in 0.16 sec.
2025-11-14 17:02:00,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,629 - INFO - Going to convert document batch...
2025-11-14 17:02:00,630 - INFO - Processing document 4_2024-05-20
2025-11-14 17:02:00,661 - INFO - Finished converting document 4_2024-05-20 in 0.05 sec.
2025-11-14 17:02:00,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,722 - INFO - Going to convert document batch...
2025-11-14 17:02:00,725 - INFO - Processing document 4_2024-05-21
2025-11-14 17:02:00,756 - INFO - Finished converting document 4_2024-05-21 in 0.06 sec.
2025-11-14 17:02:00,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-05-17' --> 'data\processed_data\MA\4_2024-05-17.md'
Converted 'data\edgar_documents\MA\4_2024-05-20' --> 'data\processed_data\MA\4_2024-05-20.md'
Converted 'data\edgar_documents\MA\4_2024-05-21' --> 'data\processed_data\MA\4_2024-05-21.md'


2025-11-14 17:02:00,813 - INFO - Going to convert document batch...
2025-11-14 17:02:00,814 - INFO - Processing document 4_2024-05-23
2025-11-14 17:02:00,852 - INFO - Finished converting document 4_2024-05-23 in 0.06 sec.
2025-11-14 17:02:00,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:00,919 - INFO - Going to convert document batch...
2025-11-14 17:02:00,919 - INFO - Processing document 4_2024-05-24
2025-11-14 17:02:00,949 - INFO - Finished converting document 4_2024-05-24 in 0.06 sec.
2025-11-14 17:02:00,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,006 - INFO - Going to convert document batch...
2025-11-14 17:02:01,008 - INFO - Processing document 4_2024-05-28
2025-11-14 17:02:01,037 - INFO - Finished converting document 4_2024-05-28 in 0.05 sec.
2025-11-14 17:02:01,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-05-23' --> 'data\processed_data\MA\4_2024-05-23.md'
Converted 'data\edgar_documents\MA\4_2024-05-24' --> 'data\processed_data\MA\4_2024-05-24.md'
Converted 'data\edgar_documents\MA\4_2024-05-28' --> 'data\processed_data\MA\4_2024-05-28.md'


2025-11-14 17:02:01,094 - INFO - Going to convert document batch...
2025-11-14 17:02:01,095 - INFO - Processing document 4_2024-05-29
2025-11-14 17:02:01,133 - INFO - Finished converting document 4_2024-05-29 in 0.06 sec.
2025-11-14 17:02:01,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,201 - INFO - Going to convert document batch...
2025-11-14 17:02:01,202 - INFO - Processing document 4_2024-05-30
2025-11-14 17:02:01,249 - INFO - Finished converting document 4_2024-05-30 in 0.08 sec.
2025-11-14 17:02:01,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,315 - INFO - Going to convert document batch...
2025-11-14 17:02:01,316 - INFO - Processing document 4_2024-05-31
2025-11-14 17:02:01,354 - INFO - Finished converting document 4_2024-05-31 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-05-29' --> 'data\processed_data\MA\4_2024-05-29.md'
Converted 'data\edgar_documents\MA\4_2024-05-30' --> 'data\processed_data\MA\4_2024-05-30.md'


2025-11-14 17:02:01,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,413 - INFO - Going to convert document batch...
2025-11-14 17:02:01,414 - INFO - Processing document 4_2024-06-03
2025-11-14 17:02:01,451 - INFO - Finished converting document 4_2024-06-03 in 0.08 sec.
2025-11-14 17:02:01,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,522 - INFO - Going to convert document batch...
2025-11-14 17:02:01,522 - INFO - Processing document 4_2024-06-04
2025-11-14 17:02:01,569 - INFO - Finished converting document 4_2024-06-04 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-05-31' --> 'data\processed_data\MA\4_2024-05-31.md'
Converted 'data\edgar_documents\MA\4_2024-06-03' --> 'data\processed_data\MA\4_2024-06-03.md'


2025-11-14 17:02:01,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,628 - INFO - Going to convert document batch...
2025-11-14 17:02:01,628 - INFO - Processing document 4_2024-06-05
2025-11-14 17:02:01,663 - INFO - Finished converting document 4_2024-06-05 in 0.06 sec.
2025-11-14 17:02:01,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,719 - INFO - Going to convert document batch...
2025-11-14 17:02:01,720 - INFO - Processing document 4_2024-06-06
2025-11-14 17:02:01,743 - INFO - Finished converting document 4_2024-06-06 in 0.05 sec.
2025-11-14 17:02:01,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-06-04' --> 'data\processed_data\MA\4_2024-06-04.md'
Converted 'data\edgar_documents\MA\4_2024-06-05' --> 'data\processed_data\MA\4_2024-06-05.md'
Converted 'data\edgar_documents\MA\4_2024-06-06' --> 'data\processed_data\MA\4_2024-06-06.md'


2025-11-14 17:02:01,796 - INFO - Going to convert document batch...
2025-11-14 17:02:01,797 - INFO - Processing document 4_2024-06-07
2025-11-14 17:02:01,835 - INFO - Finished converting document 4_2024-06-07 in 0.06 sec.
2025-11-14 17:02:01,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:01,905 - INFO - Going to convert document batch...
2025-11-14 17:02:01,906 - INFO - Processing document 4_2024-06-10
2025-11-14 17:02:02,020 - INFO - Finished converting document 4_2024-06-10 in 0.06 sec.
2025-11-14 17:02:02,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-06-07' --> 'data\processed_data\MA\4_2024-06-07.md'
Converted 'data\edgar_documents\MA\4_2024-06-10' --> 'data\processed_data\MA\4_2024-06-10.md'


2025-11-14 17:02:02,085 - INFO - Going to convert document batch...
2025-11-14 17:02:02,086 - INFO - Processing document 4_2024-06-11
2025-11-14 17:02:02,119 - INFO - Finished converting document 4_2024-06-11 in 0.05 sec.
2025-11-14 17:02:02,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,185 - INFO - Going to convert document batch...
2025-11-14 17:02:02,186 - INFO - Processing document 4_2024-06-12
2025-11-14 17:02:02,217 - INFO - Finished converting document 4_2024-06-12 in 0.06 sec.
2025-11-14 17:02:02,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,294 - INFO - Going to convert document batch...
2025-11-14 17:02:02,295 - INFO - Processing document 4_2024-06-13
2025-11-14 17:02:02,330 - INFO - Finished converting document 4_2024-06-13 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-06-11' --> 'data\processed_data\MA\4_2024-06-11.md'
Converted 'data\edgar_documents\MA\4_2024-06-12' --> 'data\processed_data\MA\4_2024-06-12.md'
Converted 'data\edgar_documents\MA\4_2024-06-13' --> 'data\processed_data\MA\4_2024-06-13.md'


2025-11-14 17:02:02,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,398 - INFO - Going to convert document batch...
2025-11-14 17:02:02,399 - INFO - Processing document 4_2024-06-14
2025-11-14 17:02:02,444 - INFO - Finished converting document 4_2024-06-14 in 0.08 sec.
2025-11-14 17:02:02,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,614 - INFO - Going to convert document batch...
2025-11-14 17:02:02,616 - INFO - Processing document 4_2024-06-17
2025-11-14 17:02:02,648 - INFO - Finished converting document 4_2024-06-17 in 0.06 sec.
2025-11-14 17:02:02,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,724 - INFO - Going to convert document batch...
2025-11-14 17:02:02,725 - INFO - Processing document 4_2024-06-18
2025-11-14 17:02:02,760 - INFO - Finished converting document 4_2024-06-18 in 0.09 sec.


Converted 'data\edgar_documents\MA\4_2024-06-14' --> 'data\processed_data\MA\4_2024-06-14.md'
Converted 'data\edgar_documents\MA\4_2024-06-17' --> 'data\processed_data\MA\4_2024-06-17.md'


2025-11-14 17:02:02,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,863 - INFO - Going to convert document batch...
2025-11-14 17:02:02,864 - INFO - Processing document 4_2024-06-20
2025-11-14 17:02:02,904 - INFO - Finished converting document 4_2024-06-20 in 0.11 sec.
2025-11-14 17:02:02,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:02,959 - INFO - Going to convert document batch...
2025-11-14 17:02:02,960 - INFO - Processing document 4_2024-06-21
2025-11-14 17:02:02,980 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2024-06-18' --> 'data\processed_data\MA\4_2024-06-18.md'
Converted 'data\edgar_documents\MA\4_2024-06-20' --> 'data\processed_data\MA\4_2024-06-20.md'


2025-11-14 17:02:03,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,092 - INFO - Going to convert document batch...
2025-11-14 17:02:03,093 - INFO - Processing document 4_2024-06-24
2025-11-14 17:02:03,147 - INFO - Finished converting document 4_2024-06-24 in 0.14 sec.


Converted 'data\edgar_documents\MA\4_2024-06-21' --> 'data\processed_data\MA\4_2024-06-21.md'
Converted 'data\edgar_documents\MA\4_2024-06-24' --> 'data\processed_data\MA\4_2024-06-24.md'


2025-11-14 17:02:03,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,257 - INFO - Going to convert document batch...
2025-11-14 17:02:03,259 - INFO - Processing document 4_2024-06-25
2025-11-14 17:02:03,294 - INFO - Finished converting document 4_2024-06-25 in 0.11 sec.
2025-11-14 17:02:03,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,407 - INFO - Going to convert document batch...
2025-11-14 17:02:03,408 - INFO - Processing document 4_2024-06-26
2025-11-14 17:02:03,449 - INFO - Finished converting document 4_2024-06-26 in 0.12 sec.
2025-11-14 17:02:03,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,519 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MA\4_2024-06-25' --> 'data\processed_data\MA\4_2024-06-25.md'
Converted 'data\edgar_documents\MA\4_2024-06-26' --> 'data\processed_data\MA\4_2024-06-26.md'


2025-11-14 17:02:03,519 - INFO - Processing document 4_2024-06-27
2025-11-14 17:02:03,559 - INFO - Finished converting document 4_2024-06-27 in 0.09 sec.
2025-11-14 17:02:03,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,662 - INFO - Going to convert document batch...
2025-11-14 17:02:03,663 - INFO - Processing document 4_2024-08-05
2025-11-14 17:02:03,688 - INFO - Finished converting document 4_2024-08-05 in 0.09 sec.
2025-11-14 17:02:03,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,766 - INFO - Going to convert document batch...
2025-11-14 17:02:03,767 - INFO - Processing document 4_2024-08-06
2025-11-14 17:02:03,803 - INFO - Finished converting document 4_2024-08-06 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-06-27' --> 'data\processed_data\MA\4_2024-06-27.md'
Converted 'data\edgar_documents\MA\4_2024-08-05' --> 'data\processed_data\MA\4_2024-08-05.md'


2025-11-14 17:02:03,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,879 - INFO - Going to convert document batch...
2025-11-14 17:02:03,880 - INFO - Processing document 4_2024-08-19
2025-11-14 17:02:03,910 - INFO - Finished converting document 4_2024-08-19 in 0.08 sec.
2025-11-14 17:02:03,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:03,976 - INFO - Going to convert document batch...
2025-11-14 17:02:03,977 - INFO - Processing document 4_2024-08-20
2025-11-14 17:02:04,012 - INFO - Finished converting document 4_2024-08-20 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-08-06' --> 'data\processed_data\MA\4_2024-08-06.md'
Converted 'data\edgar_documents\MA\4_2024-08-19' --> 'data\processed_data\MA\4_2024-08-19.md'


2025-11-14 17:02:04,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:04,124 - INFO - Going to convert document batch...
2025-11-14 17:02:04,126 - INFO - Processing document 4_2024-08-21
2025-11-14 17:02:04,190 - INFO - Finished converting document 4_2024-08-21 in 0.14 sec.


Converted 'data\edgar_documents\MA\4_2024-08-20' --> 'data\processed_data\MA\4_2024-08-20.md'
Converted 'data\edgar_documents\MA\4_2024-08-21' --> 'data\processed_data\MA\4_2024-08-21.md'


2025-11-14 17:02:04,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:04,279 - INFO - Going to convert document batch...
2025-11-14 17:02:04,280 - INFO - Processing document 4_2024-08-22
2025-11-14 17:02:04,591 - INFO - Finished converting document 4_2024-08-22 in 0.38 sec.
2025-11-14 17:02:04,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:04,667 - INFO - Going to convert document batch...
2025-11-14 17:02:04,668 - INFO - Processing document 4_2024-08-23
2025-11-14 17:02:04,699 - INFO - Finished converting document 4_2024-08-23 in 0.06 sec.
2025-11-14 17:02:04,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:04,751 - INFO - Going to convert document batch...
2025-11-14 17:02:04,752 - INFO - Processing document 4_2024-08-30
2025-11-14 17:02:04,775 - INFO - Finished converting document 4_2024-08-30 in 0.05 sec.
2025-11-14 17:02:04,824 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\MA\4_2024-08-22' --> 'data\processed_data\MA\4_2024-08-22.md'
Converted 'data\edgar_documents\MA\4_2024-08-23' --> 'data\processed_data\MA\4_2024-08-23.md'
Converted 'data\edgar_documents\MA\4_2024-08-30' --> 'data\processed_data\MA\4_2024-08-30.md'


2025-11-14 17:02:04,825 - ERROR - Input document 4_2024-09-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:02:04,827 - INFO - Going to convert document batch...
2025-11-14 17:02:04,854 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:02:04,854 - ERROR - Input document 4_2024-09-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\MA\4_2024-09-03: File format not allowed: data\edgar_documents\MA\4_2024-09-03
Error processing data\edgar_documents\MA\4_2024-09-04: File format not allowed: data\edgar_documents\MA\4_2024-09-04


2025-11-14 17:02:05,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,074 - INFO - Going to convert document batch...
2025-11-14 17:02:05,075 - INFO - Processing document 4_2024-09-18
2025-11-14 17:02:05,100 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 17:02:05,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,150 - INFO - Going to convert document batch...
2025-11-14 17:02:05,151 - INFO - Processing document 4_2024-09-23
2025-11-14 17:02:05,182 - INFO - Finished converting document 4_2024-09-23 in 0.05 sec.
2025-11-14 17:02:05,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2024-09-17' --> 'data\processed_data\MA\4_2024-09-17.md'
Converted 'data\edgar_documents\MA\4_2024-09-18' --> 'data\processed_data\MA\4_2024-09-18.md'
Converted 'data\edgar_documents\MA\4_2024-09-23' --> 'data\processed_data\MA\4_2024-09-23.md'


2025-11-14 17:02:05,254 - INFO - Going to convert document batch...
2025-11-14 17:02:05,257 - INFO - Processing document 4_2024-10-01
2025-11-14 17:02:05,394 - INFO - Finished converting document 4_2024-10-01 in 0.19 sec.
2025-11-14 17:02:05,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,481 - INFO - Going to convert document batch...
2025-11-14 17:02:05,482 - INFO - Processing document 4_2024-10-03
2025-11-14 17:02:05,511 - INFO - Finished converting document 4_2024-10-03 in 0.09 sec.
2025-11-14 17:02:05,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,588 - INFO - Going to convert document batch...
2025-11-14 17:02:05,589 - INFO - Processing document 4_2024-11-04
2025-11-14 17:02:05,613 - INFO - Finished converting document 4_2024-11-04 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2024-10-01' --> 'data\processed_data\MA\4_2024-10-01.md'
Converted 'data\edgar_documents\MA\4_2024-10-03' --> 'data\processed_data\MA\4_2024-10-03.md'


2025-11-14 17:02:05,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,677 - INFO - Going to convert document batch...
2025-11-14 17:02:05,680 - INFO - Processing document 4_2024-12-09
2025-11-14 17:02:05,702 - INFO - Finished converting document 4_2024-12-09 in 0.06 sec.
2025-11-14 17:02:05,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,750 - INFO - Going to convert document batch...
2025-11-14 17:02:05,750 - INFO - Processing document 4_2025-02-03
2025-11-14 17:02:05,772 - INFO - Finished converting document 4_2025-02-03 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2024-11-04' --> 'data\processed_data\MA\4_2024-11-04.md'
Converted 'data\edgar_documents\MA\4_2024-12-09' --> 'data\processed_data\MA\4_2024-12-09.md'


2025-11-14 17:02:05,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:05,935 - INFO - Going to convert document batch...
2025-11-14 17:02:05,936 - INFO - Processing document 4_2025-02-18
2025-11-14 17:02:05,961 - INFO - Finished converting document 4_2025-02-18 in 0.08 sec.
2025-11-14 17:02:06,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,026 - INFO - Going to convert document batch...
2025-11-14 17:02:06,027 - INFO - Processing document 4_2025-02-20
2025-11-14 17:02:06,067 - INFO - Finished converting document 4_2025-02-20 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2025-02-03' --> 'data\processed_data\MA\4_2025-02-03.md'
Converted 'data\edgar_documents\MA\4_2025-02-18' --> 'data\processed_data\MA\4_2025-02-18.md'


2025-11-14 17:02:06,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,149 - INFO - Going to convert document batch...
2025-11-14 17:02:06,150 - INFO - Processing document 4_2025-02-27
2025-11-14 17:02:06,191 - INFO - Finished converting document 4_2025-02-27 in 0.09 sec.
2025-11-14 17:02:06,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2025-02-20' --> 'data\processed_data\MA\4_2025-02-20.md'
Converted 'data\edgar_documents\MA\4_2025-02-27' --> 'data\processed_data\MA\4_2025-02-27.md'


2025-11-14 17:02:06,313 - INFO - Going to convert document batch...
2025-11-14 17:02:06,315 - INFO - Processing document 4_2025-03-04
2025-11-14 17:02:06,352 - INFO - Finished converting document 4_2025-03-04 in 0.11 sec.
2025-11-14 17:02:06,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,426 - INFO - Going to convert document batch...
2025-11-14 17:02:06,427 - INFO - Processing document 4_2025-03-06
2025-11-14 17:02:06,468 - INFO - Finished converting document 4_2025-03-06 in 0.08 sec.
2025-11-14 17:02:06,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,532 - INFO - Going to convert document batch...
2025-11-14 17:02:06,532 - INFO - Processing document 4_2025-03-20
2025-11-14 17:02:06,571 - INFO - Finished converting document 4_2025-03-20 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2025-03-04' --> 'data\processed_data\MA\4_2025-03-04.md'
Converted 'data\edgar_documents\MA\4_2025-03-06' --> 'data\processed_data\MA\4_2025-03-06.md'
Converted 'data\edgar_documents\MA\4_2025-03-20' --> 'data\processed_data\MA\4_2025-03-20.md'


2025-11-14 17:02:06,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,634 - INFO - Going to convert document batch...
2025-11-14 17:02:06,635 - INFO - Processing document 4_2025-03-27
2025-11-14 17:02:06,665 - INFO - Finished converting document 4_2025-03-27 in 0.06 sec.
2025-11-14 17:02:06,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,714 - INFO - Going to convert document batch...
2025-11-14 17:02:06,714 - INFO - Processing document 4_2025-04-02
2025-11-14 17:02:06,741 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 17:02:06,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,783 - INFO - Going to convert document batch...
2025-11-14 17:02:06,783 - INFO - Processing document 4_2025-04-09
2025-11-14 17:02:06,807 - INFO - Finished converting document 4_2025-04-09 in 0.05 sec.
2025-11-14 17:02:06,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MA\4_2025-03-27' --> 'data\processed_data\MA\4_2025-03-27.md'
Converted 'data\edgar_documents\MA\4_2025-04-02' --> 'data\processed_data\MA\4_2025-04-02.md'
Converted 'data\edgar_documents\MA\4_2025-04-09' --> 'data\processed_data\MA\4_2025-04-09.md'


2025-11-14 17:02:06,885 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 17:02:06,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:06,935 - INFO - Going to convert document batch...
2025-11-14 17:02:06,936 - INFO - Processing document 4_2025-05-12
2025-11-14 17:02:06,963 - INFO - Finished converting document 4_2025-05-12 in 0.05 sec.
2025-11-14 17:02:07,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,027 - INFO - Going to convert document batch...
2025-11-14 17:02:07,028 - INFO - Processing document 4_2025-05-15
2025-11-14 17:02:07,052 - INFO - Finished converting document 4_2025-05-15 in 0.06 sec.
2025-11-14 17:02:07,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2025-05-05' --> 'data\processed_data\MA\4_2025-05-05.md'
Converted 'data\edgar_documents\MA\4_2025-05-12' --> 'data\processed_data\MA\4_2025-05-12.md'
Converted 'data\edgar_documents\MA\4_2025-05-15' --> 'data\processed_data\MA\4_2025-05-15.md'


2025-11-14 17:02:07,103 - INFO - Going to convert document batch...
2025-11-14 17:02:07,104 - INFO - Processing document 4_2025-06-06
2025-11-14 17:02:07,225 - INFO - Finished converting document 4_2025-06-06 in 0.14 sec.
2025-11-14 17:02:07,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,345 - INFO - Going to convert document batch...
2025-11-14 17:02:07,346 - INFO - Processing document 4_2025-06-13
2025-11-14 17:02:07,379 - INFO - Finished converting document 4_2025-06-13 in 0.09 sec.
2025-11-14 17:02:07,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,432 - INFO - Going to convert document batch...
2025-11-14 17:02:07,432 - INFO - Processing document 4_2025-06-16
2025-11-14 17:02:07,451 - INFO - Finished converting document 4_2025-06-16 in 0.05 sec.


Converted 'data\edgar_documents\MA\4_2025-06-06' --> 'data\processed_data\MA\4_2025-06-06.md'
Converted 'data\edgar_documents\MA\4_2025-06-13' --> 'data\processed_data\MA\4_2025-06-13.md'


2025-11-14 17:02:07,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,509 - INFO - Going to convert document batch...
2025-11-14 17:02:07,510 - INFO - Processing document 4_2025-06-17
2025-11-14 17:02:07,568 - INFO - Finished converting document 4_2025-06-17 in 0.09 sec.
2025-11-14 17:02:07,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2025-06-16' --> 'data\processed_data\MA\4_2025-06-16.md'
Converted 'data\edgar_documents\MA\4_2025-06-17' --> 'data\processed_data\MA\4_2025-06-17.md'


2025-11-14 17:02:07,672 - INFO - Going to convert document batch...
2025-11-14 17:02:07,674 - INFO - Processing document 4_2025-06-23
2025-11-14 17:02:07,799 - INFO - Finished converting document 4_2025-06-23 in 0.20 sec.
2025-11-14 17:02:07,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,902 - INFO - Going to convert document batch...
2025-11-14 17:02:07,903 - INFO - Processing document 4_2025-06-26
2025-11-14 17:02:07,927 - INFO - Finished converting document 4_2025-06-26 in 0.09 sec.
2025-11-14 17:02:07,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:07,969 - INFO - Going to convert document batch...
2025-11-14 17:02:07,969 - INFO - Processing document 4_2025-06-30
2025-11-14 17:02:07,991 - INFO - Finished converting document 4_2025-06-30 in 0.03 sec.


Converted 'data\edgar_documents\MA\4_2025-06-23' --> 'data\processed_data\MA\4_2025-06-23.md'
Converted 'data\edgar_documents\MA\4_2025-06-26' --> 'data\processed_data\MA\4_2025-06-26.md'


2025-11-14 17:02:08,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,040 - INFO - Going to convert document batch...
2025-11-14 17:02:08,041 - INFO - Processing document 4_2025-07-08
2025-11-14 17:02:08,063 - INFO - Finished converting document 4_2025-07-08 in 0.05 sec.
2025-11-14 17:02:08,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,118 - INFO - Going to convert document batch...
2025-11-14 17:02:08,119 - INFO - Processing document 4_2025-08-06
2025-11-14 17:02:08,158 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 17:02:08,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,213 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MA\4_2025-06-30' --> 'data\processed_data\MA\4_2025-06-30.md'
Converted 'data\edgar_documents\MA\4_2025-07-08' --> 'data\processed_data\MA\4_2025-07-08.md'
Converted 'data\edgar_documents\MA\4_2025-08-06' --> 'data\processed_data\MA\4_2025-08-06.md'


2025-11-14 17:02:08,214 - INFO - Processing document 4_2025-08-20
2025-11-14 17:02:08,266 - INFO - Finished converting document 4_2025-08-20 in 0.08 sec.
2025-11-14 17:02:08,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,361 - INFO - Going to convert document batch...
2025-11-14 17:02:08,362 - INFO - Processing document 4_2025-08-25
2025-11-14 17:02:08,385 - INFO - Finished converting document 4_2025-08-25 in 0.06 sec.
2025-11-14 17:02:08,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,448 - INFO - Going to convert document batch...
2025-11-14 17:02:08,449 - INFO - Processing document 4_2025-09-03
2025-11-14 17:02:08,491 - INFO - Finished converting document 4_2025-09-03 in 0.08 sec.


Converted 'data\edgar_documents\MA\4_2025-08-20' --> 'data\processed_data\MA\4_2025-08-20.md'
Converted 'data\edgar_documents\MA\4_2025-08-25' --> 'data\processed_data\MA\4_2025-08-25.md'


2025-11-14 17:02:08,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,580 - INFO - Going to convert document batch...
2025-11-14 17:02:08,580 - INFO - Processing document 4_2025-09-19
2025-11-14 17:02:08,607 - INFO - Finished converting document 4_2025-09-19 in 0.08 sec.
2025-11-14 17:02:08,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,657 - INFO - Going to convert document batch...
2025-11-14 17:02:08,657 - INFO - Processing document 4_2025-10-03
2025-11-14 17:02:08,682 - INFO - Finished converting document 4_2025-10-03 in 0.06 sec.
2025-11-14 17:02:08,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\4_2025-09-03' --> 'data\processed_data\MA\4_2025-09-03.md'
Converted 'data\edgar_documents\MA\4_2025-09-19' --> 'data\processed_data\MA\4_2025-09-19.md'
Converted 'data\edgar_documents\MA\4_2025-10-03' --> 'data\processed_data\MA\4_2025-10-03.md'


2025-11-14 17:02:08,750 - INFO - Going to convert document batch...
2025-11-14 17:02:08,751 - INFO - Processing document 4_2025-11-03
2025-11-14 17:02:08,791 - INFO - Finished converting document 4_2025-11-03 in 0.08 sec.
2025-11-14 17:02:08,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,885 - INFO - Going to convert document batch...
2025-11-14 17:02:08,886 - INFO - Processing document 8-K_2023-01-26
2025-11-14 17:02:08,909 - INFO - Finished converting document 8-K_2023-01-26 in 0.09 sec.
2025-11-14 17:02:08,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:08,964 - INFO - Going to convert document batch...
2025-11-14 17:02:08,965 - INFO - Processing document 8-K_2023-02-14
2025-11-14 17:02:08,991 - INFO - Finished converting document 8-K_2023-02-14 in 0.06 sec.


Converted 'data\edgar_documents\MA\4_2025-11-03' --> 'data\processed_data\MA\4_2025-11-03.md'
Converted 'data\edgar_documents\MA\8-K_2023-01-26' --> 'data\processed_data\MA\8-K_2023-01-26.md'


2025-11-14 17:02:09,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,046 - INFO - Going to convert document batch...
2025-11-14 17:02:09,046 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:02:09,073 - INFO - Finished converting document 8-K_2023-03-03 in 0.06 sec.
2025-11-14 17:02:09,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,147 - INFO - Going to convert document batch...
2025-11-14 17:02:09,147 - INFO - Processing document 8-K_2023-03-09
2025-11-14 17:02:09,168 - INFO - Finished converting document 8-K_2023-03-09 in 0.08 sec.
2025-11-14 17:02:09,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,213 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MA\8-K_2023-02-14' --> 'data\processed_data\MA\8-K_2023-02-14.md'
Converted 'data\edgar_documents\MA\8-K_2023-03-03' --> 'data\processed_data\MA\8-K_2023-03-03.md'
Converted 'data\edgar_documents\MA\8-K_2023-03-09' --> 'data\processed_data\MA\8-K_2023-03-09.md'


2025-11-14 17:02:09,214 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:02:09,242 - INFO - Finished converting document 8-K_2023-04-27 in 0.06 sec.
2025-11-14 17:02:09,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,309 - INFO - Going to convert document batch...
2025-11-14 17:02:09,310 - INFO - Processing document 8-K_2023-05-19
2025-11-14 17:02:09,329 - INFO - Finished converting document 8-K_2023-05-19 in 0.05 sec.
2025-11-14 17:02:09,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,397 - INFO - Going to convert document batch...
2025-11-14 17:02:09,398 - INFO - Processing document 8-K_2023-06-29
2025-11-14 17:02:09,457 - INFO - Finished converting document 8-K_2023-06-29 in 0.11 sec.


Converted 'data\edgar_documents\MA\8-K_2023-04-27' --> 'data\processed_data\MA\8-K_2023-04-27.md'
Converted 'data\edgar_documents\MA\8-K_2023-05-19' --> 'data\processed_data\MA\8-K_2023-05-19.md'


2025-11-14 17:02:09,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,560 - INFO - Going to convert document batch...
2025-11-14 17:02:09,561 - INFO - Processing document 8-K_2023-07-27
2025-11-14 17:02:09,590 - INFO - Finished converting document 8-K_2023-07-27 in 0.09 sec.
2025-11-14 17:02:09,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,661 - INFO - Going to convert document batch...
2025-11-14 17:02:09,662 - INFO - Processing document 8-K_2023-10-26
2025-11-14 17:02:09,682 - INFO - Finished converting document 8-K_2023-10-26 in 0.08 sec.


Converted 'data\edgar_documents\MA\8-K_2023-06-29' --> 'data\processed_data\MA\8-K_2023-06-29.md'
Converted 'data\edgar_documents\MA\8-K_2023-07-27' --> 'data\processed_data\MA\8-K_2023-07-27.md'


2025-11-14 17:02:09,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:09,737 - INFO - Going to convert document batch...
2025-11-14 17:02:09,739 - INFO - Processing document 8-K_2023-12-11
2025-11-14 17:02:09,764 - INFO - Finished converting document 8-K_2023-12-11 in 0.06 sec.


Converted 'data\edgar_documents\MA\8-K_2023-10-26' --> 'data\processed_data\MA\8-K_2023-10-26.md'


2025-11-14 17:02:10,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,175 - INFO - Going to convert document batch...
2025-11-14 17:02:10,176 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:02:10,201 - INFO - Finished converting document 8-K_2024-01-31 in 0.09 sec.
2025-11-14 17:02:10,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,249 - INFO - Going to convert document batch...
2025-11-14 17:02:10,250 - INFO - Processing document 8-K_2024-03-26


Converted 'data\edgar_documents\MA\8-K_2023-12-11' --> 'data\processed_data\MA\8-K_2023-12-11.md'
Converted 'data\edgar_documents\MA\8-K_2024-01-31' --> 'data\processed_data\MA\8-K_2024-01-31.md'


2025-11-14 17:02:10,350 - INFO - Finished converting document 8-K_2024-03-26 in 0.12 sec.
2025-11-14 17:02:10,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,458 - INFO - Going to convert document batch...
2025-11-14 17:02:10,459 - INFO - Processing document 8-K_2024-05-01
2025-11-14 17:02:10,483 - INFO - Finished converting document 8-K_2024-05-01 in 0.09 sec.
2025-11-14 17:02:10,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,534 - INFO - Going to convert document batch...
2025-11-14 17:02:10,535 - INFO - Processing document 8-K_2024-05-09
2025-11-14 17:02:10,559 - INFO - Finished converting document 8-K_2024-05-09 in 0.06 sec.


Converted 'data\edgar_documents\MA\8-K_2024-03-26' --> 'data\processed_data\MA\8-K_2024-03-26.md'
Converted 'data\edgar_documents\MA\8-K_2024-05-01' --> 'data\processed_data\MA\8-K_2024-05-01.md'


2025-11-14 17:02:10,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,627 - INFO - Going to convert document batch...
2025-11-14 17:02:10,628 - INFO - Processing document 8-K_2024-06-21
2025-11-14 17:02:10,690 - INFO - Finished converting document 8-K_2024-06-21 in 0.11 sec.
2025-11-14 17:02:10,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,758 - INFO - Going to convert document batch...
2025-11-14 17:02:10,759 - INFO - Processing document 8-K_2024-06-28


Converted 'data\edgar_documents\MA\8-K_2024-05-09' --> 'data\processed_data\MA\8-K_2024-05-09.md'
Converted 'data\edgar_documents\MA\8-K_2024-06-21' --> 'data\processed_data\MA\8-K_2024-06-21.md'


2025-11-14 17:02:10,786 - INFO - Finished converting document 8-K_2024-06-28 in 0.05 sec.
2025-11-14 17:02:10,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:10,915 - INFO - Going to convert document batch...
2025-11-14 17:02:10,917 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:02:10,958 - INFO - Finished converting document 8-K_2024-07-31 in 0.14 sec.
2025-11-14 17:02:11,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\8-K_2024-06-28' --> 'data\processed_data\MA\8-K_2024-06-28.md'
Converted 'data\edgar_documents\MA\8-K_2024-07-31' --> 'data\processed_data\MA\8-K_2024-07-31.md'


2025-11-14 17:02:11,033 - INFO - Going to convert document batch...
2025-11-14 17:02:11,034 - INFO - Processing document 8-K_2024-09-05
2025-11-14 17:02:11,071 - INFO - Finished converting document 8-K_2024-09-05 in 0.09 sec.
2025-11-14 17:02:11,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,128 - INFO - Going to convert document batch...
2025-11-14 17:02:11,128 - INFO - Processing document 8-K_2024-10-31
2025-11-14 17:02:11,150 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 17:02:11,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,194 - INFO - Going to convert document batch...
2025-11-14 17:02:11,195 - INFO - Processing document 8-K_2024-11-13
2025-11-14 17:02:11,220 - INFO - Finished converting document 8-K_2024-11-13 in 0.05 sec.
2025-11-14 17:02:11,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\8-K_2024-09-05' --> 'data\processed_data\MA\8-K_2024-09-05.md'
Converted 'data\edgar_documents\MA\8-K_2024-10-31' --> 'data\processed_data\MA\8-K_2024-10-31.md'
Converted 'data\edgar_documents\MA\8-K_2024-11-13' --> 'data\processed_data\MA\8-K_2024-11-13.md'


2025-11-14 17:02:11,286 - INFO - Going to convert document batch...
2025-11-14 17:02:11,287 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:02:11,311 - INFO - Finished converting document 8-K_2025-01-30 in 0.06 sec.
2025-11-14 17:02:11,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,369 - INFO - Going to convert document batch...
2025-11-14 17:02:11,370 - INFO - Processing document 8-K_2025-02-10
2025-11-14 17:02:11,395 - INFO - Finished converting document 8-K_2025-02-10 in 0.05 sec.
2025-11-14 17:02:11,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,447 - INFO - Going to convert document batch...
2025-11-14 17:02:11,448 - INFO - Processing document 8-K_2025-02-26
2025-11-14 17:02:11,475 - INFO - Finished converting document 8-K_2025-02-26 in 0.06 sec.
2025-11-14 17:02:11,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\8-K_2025-01-30' --> 'data\processed_data\MA\8-K_2025-01-30.md'
Converted 'data\edgar_documents\MA\8-K_2025-02-10' --> 'data\processed_data\MA\8-K_2025-02-10.md'
Converted 'data\edgar_documents\MA\8-K_2025-02-26' --> 'data\processed_data\MA\8-K_2025-02-26.md'


2025-11-14 17:02:11,553 - INFO - Going to convert document batch...
2025-11-14 17:02:11,554 - INFO - Processing document 8-K_2025-02-27
2025-11-14 17:02:11,587 - INFO - Finished converting document 8-K_2025-02-27 in 0.08 sec.
2025-11-14 17:02:11,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,742 - INFO - Going to convert document batch...
2025-11-14 17:02:11,744 - INFO - Processing document 8-K_2025-05-01
2025-11-14 17:02:11,765 - INFO - Finished converting document 8-K_2025-05-01 in 0.16 sec.


Converted 'data\edgar_documents\MA\8-K_2025-02-27' --> 'data\processed_data\MA\8-K_2025-02-27.md'
Converted 'data\edgar_documents\MA\8-K_2025-05-01' --> 'data\processed_data\MA\8-K_2025-05-01.md'


2025-11-14 17:02:11,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:11,883 - INFO - Going to convert document batch...
2025-11-14 17:02:11,884 - INFO - Processing document 8-K_2025-06-26
2025-11-14 17:02:11,949 - INFO - Finished converting document 8-K_2025-06-26 in 0.17 sec.
2025-11-14 17:02:12,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:12,161 - INFO - Going to convert document batch...
2025-11-14 17:02:12,162 - INFO - Processing document 8-K_2025-07-31
2025-11-14 17:02:12,182 - INFO - Finished converting document 8-K_2025-07-31 in 0.19 sec.


Converted 'data\edgar_documents\MA\8-K_2025-06-26' --> 'data\processed_data\MA\8-K_2025-06-26.md'


2025-11-14 17:02:12,309 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:12,331 - INFO - Going to convert document batch...
2025-11-14 17:02:12,338 - INFO - Processing document 8-K_2025-10-30
2025-11-14 17:02:12,364 - INFO - Finished converting document 8-K_2025-10-30 in 0.16 sec.


Converted 'data\edgar_documents\MA\8-K_2025-07-31' --> 'data\processed_data\MA\8-K_2025-07-31.md'


2025-11-14 17:02:12,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:12,456 - INFO - Going to convert document batch...
2025-11-14 17:02:12,457 - INFO - Processing document 8-K_2025-11-10
2025-11-14 17:02:12,487 - INFO - Finished converting document 8-K_2025-11-10 in 0.09 sec.


Converted 'data\edgar_documents\MA\8-K_2025-10-30' --> 'data\processed_data\MA\8-K_2025-10-30.md'
Converted 'data\edgar_documents\MA\8-K_2025-11-10' --> 'data\processed_data\MA\8-K_2025-11-10.md'


2025-11-14 17:02:12,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:13,582 - INFO - Going to convert document batch...
2025-11-14 17:02:13,583 - INFO - Processing document DEF-14A_2023-04-28
2025-11-14 17:02:19,564 - INFO - Finished converting document DEF-14A_2023-04-28 in 7.05 sec.
2025-11-14 17:02:21,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\DEF-14A_2023-04-28' --> 'data\processed_data\MA\DEF-14A_2023-04-28.md'


2025-11-14 17:02:22,442 - INFO - Going to convert document batch...
2025-11-14 17:02:22,443 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 17:02:27,651 - INFO - Finished converting document DEF-14A_2024-04-26 in 6.39 sec.
2025-11-14 17:02:29,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\DEF-14A_2024-04-26' --> 'data\processed_data\MA\DEF-14A_2024-04-26.md'


2025-11-14 17:02:30,071 - INFO - Going to convert document batch...
2025-11-14 17:02:30,072 - INFO - Processing document DEF-14A_2025-04-28
2025-11-14 17:02:35,282 - INFO - Finished converting document DEF-14A_2025-04-28 in 6.36 sec.
2025-11-14 17:02:37,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MA\DEF-14A_2025-04-28' --> 'data\processed_data\MA\DEF-14A_2025-04-28.md'
Processed 180 new files. Errors: 4
Found 135 files to process in data\edgar_documents\MCD


2025-11-14 17:02:40,636 - INFO - Going to convert document batch...
2025-11-14 17:02:40,640 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:02:40,642 - INFO - Processing document 10-K_2023-02-24
2025-11-14 17:02:45,000 - INFO - Finished converting document 10-K_2023-02-24 in 7.20 sec.


Converted 'data\edgar_documents\MCD\10-K_2023-02-24' --> 'data\processed_data\MCD\10-K_2023-02-24.md'


2025-11-14 17:02:47,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:02:49,961 - INFO - Going to convert document batch...
2025-11-14 17:02:49,963 - INFO - Processing document 10-K_2024-02-22
2025-11-14 17:02:54,760 - INFO - Finished converting document 10-K_2024-02-22 in 7.73 sec.
2025-11-14 17:02:57,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-K_2024-02-22' --> 'data\processed_data\MCD\10-K_2024-02-22.md'


2025-11-14 17:02:59,265 - INFO - Going to convert document batch...
2025-11-14 17:02:59,267 - INFO - Processing document 10-K_2025-02-25
2025-11-14 17:03:04,798 - INFO - Finished converting document 10-K_2025-02-25 in 7.92 sec.
2025-11-14 17:03:07,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-K_2025-02-25' --> 'data\processed_data\MCD\10-K_2025-02-25.md'


2025-11-14 17:03:08,263 - INFO - Going to convert document batch...
2025-11-14 17:03:08,265 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 17:03:10,677 - INFO - Finished converting document 10-Q_2023-05-04 in 3.59 sec.


Converted 'data\edgar_documents\MCD\10-Q_2023-05-04' --> 'data\processed_data\MCD\10-Q_2023-05-04.md'


2025-11-14 17:03:12,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:03:13,818 - INFO - Going to convert document batch...
2025-11-14 17:03:13,821 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 17:03:16,983 - INFO - Finished converting document 10-Q_2023-08-02 in 4.81 sec.
2025-11-14 17:03:19,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2023-08-02' --> 'data\processed_data\MCD\10-Q_2023-08-02.md'


2025-11-14 17:03:21,206 - INFO - Going to convert document batch...
2025-11-14 17:03:21,208 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 17:03:24,287 - INFO - Finished converting document 10-Q_2023-11-02 in 5.33 sec.
2025-11-14 17:03:26,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2023-11-02' --> 'data\processed_data\MCD\10-Q_2023-11-02.md'


2025-11-14 17:03:27,555 - INFO - Going to convert document batch...
2025-11-14 17:03:27,557 - INFO - Processing document 10-Q_2024-05-08
2025-11-14 17:03:30,353 - INFO - Finished converting document 10-Q_2024-05-08 in 4.02 sec.
2025-11-14 17:03:32,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2024-05-08' --> 'data\processed_data\MCD\10-Q_2024-05-08.md'


2025-11-14 17:03:33,499 - INFO - Going to convert document batch...
2025-11-14 17:03:33,503 - INFO - Processing document 10-Q_2024-08-08
2025-11-14 17:03:36,687 - INFO - Finished converting document 10-Q_2024-08-08 in 4.67 sec.
2025-11-14 17:03:38,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2024-08-08' --> 'data\processed_data\MCD\10-Q_2024-08-08.md'


2025-11-14 17:03:40,909 - INFO - Going to convert document batch...
2025-11-14 17:03:40,911 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 17:03:43,893 - INFO - Finished converting document 10-Q_2024-11-07 in 5.19 sec.
2025-11-14 17:03:46,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2024-11-07' --> 'data\processed_data\MCD\10-Q_2024-11-07.md'


2025-11-14 17:03:47,015 - INFO - Going to convert document batch...
2025-11-14 17:03:47,018 - INFO - Processing document 10-Q_2025-05-12
2025-11-14 17:03:49,418 - INFO - Finished converting document 10-Q_2025-05-12 in 3.53 sec.
2025-11-14 17:03:51,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2025-05-12' --> 'data\processed_data\MCD\10-Q_2025-05-12.md'


2025-11-14 17:03:52,495 - INFO - Going to convert document batch...
2025-11-14 17:03:52,498 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 17:03:56,142 - INFO - Finished converting document 10-Q_2025-08-06 in 5.25 sec.
2025-11-14 17:03:58,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2025-08-06' --> 'data\processed_data\MCD\10-Q_2025-08-06.md'


2025-11-14 17:03:59,535 - INFO - Going to convert document batch...
2025-11-14 17:03:59,538 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 17:04:02,978 - INFO - Finished converting document 10-Q_2025-11-05 in 4.94 sec.
2025-11-14 17:04:05,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\10-Q_2025-11-05' --> 'data\processed_data\MCD\10-Q_2025-11-05.md'


2025-11-14 17:04:05,120 - INFO - Going to convert document batch...
2025-11-14 17:04:05,123 - INFO - Processing document 4_2023-01-04
2025-11-14 17:04:05,209 - INFO - Finished converting document 4_2023-01-04 in 0.30 sec.
2025-11-14 17:04:05,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:05,432 - INFO - Going to convert document batch...
2025-11-14 17:04:05,434 - INFO - Processing document 4_2023-02-03
2025-11-14 17:04:05,514 - INFO - Finished converting document 4_2023-02-03 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2023-01-04' --> 'data\processed_data\MCD\4_2023-01-04.md'


2025-11-14 17:04:05,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:05,697 - INFO - Going to convert document batch...
2025-11-14 17:04:05,700 - INFO - Processing document 4_2023-02-15


Converted 'data\edgar_documents\MCD\4_2023-02-03' --> 'data\processed_data\MCD\4_2023-02-03.md'


2025-11-14 17:04:05,808 - INFO - Finished converting document 4_2023-02-15 in 0.22 sec.
2025-11-14 17:04:06,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:06,090 - INFO - Going to convert document batch...
2025-11-14 17:04:06,105 - INFO - Processing document 4_2023-02-22


Converted 'data\edgar_documents\MCD\4_2023-02-15' --> 'data\processed_data\MCD\4_2023-02-15.md'


2025-11-14 17:04:06,235 - INFO - Finished converting document 4_2023-02-22 in 0.31 sec.
2025-11-14 17:04:06,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:06,466 - INFO - Going to convert document batch...
2025-11-14 17:04:06,469 - INFO - Processing document 4_2023-02-24
2025-11-14 17:04:06,537 - INFO - Finished converting document 4_2023-02-24 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2023-02-22' --> 'data\processed_data\MCD\4_2023-02-22.md'


2025-11-14 17:04:06,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:06,702 - INFO - Going to convert document batch...
2025-11-14 17:04:06,705 - INFO - Processing document 4_2023-04-04


Converted 'data\edgar_documents\MCD\4_2023-02-24' --> 'data\processed_data\MCD\4_2023-02-24.md'


2025-11-14 17:04:06,879 - INFO - Finished converting document 4_2023-04-04 in 0.25 sec.
2025-11-14 17:04:07,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:07,064 - INFO - Going to convert document batch...
2025-11-14 17:04:07,066 - INFO - Processing document 4_2023-05-02
2025-11-14 17:04:07,133 - INFO - Finished converting document 4_2023-05-02 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2023-04-04' --> 'data\processed_data\MCD\4_2023-04-04.md'


2025-11-14 17:04:07,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:07,325 - INFO - Going to convert document batch...
2025-11-14 17:04:07,327 - INFO - Processing document 4_2023-05-05
2025-11-14 17:04:07,402 - INFO - Finished converting document 4_2023-05-05 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2023-05-02' --> 'data\processed_data\MCD\4_2023-05-02.md'


2025-11-14 17:04:07,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:07,741 - INFO - Going to convert document batch...
2025-11-14 17:04:07,743 - INFO - Processing document 4_2023-05-19


Converted 'data\edgar_documents\MCD\4_2023-05-05' --> 'data\processed_data\MCD\4_2023-05-05.md'


2025-11-14 17:04:07,875 - INFO - Finished converting document 4_2023-05-19 in 0.25 sec.
2025-11-14 17:04:08,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:08,153 - INFO - Going to convert document batch...
2025-11-14 17:04:08,156 - INFO - Processing document 4_2023-05-30


Converted 'data\edgar_documents\MCD\4_2023-05-19' --> 'data\processed_data\MCD\4_2023-05-19.md'


2025-11-14 17:04:08,250 - INFO - Finished converting document 4_2023-05-30 in 0.20 sec.
2025-11-14 17:04:08,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:08,501 - INFO - Going to convert document batch...
2025-11-14 17:04:08,503 - INFO - Processing document 4_2023-05-31


Converted 'data\edgar_documents\MCD\4_2023-05-30' --> 'data\processed_data\MCD\4_2023-05-30.md'


2025-11-14 17:04:08,621 - INFO - Finished converting document 4_2023-05-31 in 0.25 sec.
2025-11-14 17:04:08,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:08,863 - INFO - Going to convert document batch...
2025-11-14 17:04:08,867 - INFO - Processing document 4_2023-06-01


Converted 'data\edgar_documents\MCD\4_2023-05-31' --> 'data\processed_data\MCD\4_2023-05-31.md'


2025-11-14 17:04:08,954 - INFO - Finished converting document 4_2023-06-01 in 0.20 sec.
2025-11-14 17:04:09,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:09,131 - INFO - Going to convert document batch...
2025-11-14 17:04:09,134 - INFO - Processing document 4_2023-06-07
2025-11-14 17:04:09,227 - INFO - Finished converting document 4_2023-06-07 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2023-06-01' --> 'data\processed_data\MCD\4_2023-06-01.md'


2025-11-14 17:04:09,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:09,400 - INFO - Going to convert document batch...
2025-11-14 17:04:09,403 - INFO - Processing document 4_2023-06-23
2025-11-14 17:04:09,504 - INFO - Finished converting document 4_2023-06-23 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2023-06-07' --> 'data\processed_data\MCD\4_2023-06-07.md'


2025-11-14 17:04:09,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:09,725 - INFO - Going to convert document batch...
2025-11-14 17:04:09,727 - INFO - Processing document 4_2023-07-05
2025-11-14 17:04:09,810 - INFO - Finished converting document 4_2023-07-05 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2023-06-23' --> 'data\processed_data\MCD\4_2023-06-23.md'


2025-11-14 17:04:09,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:10,019 - INFO - Going to convert document batch...
2025-11-14 17:04:10,023 - INFO - Processing document 4_2023-07-21


Converted 'data\edgar_documents\MCD\4_2023-07-05' --> 'data\processed_data\MCD\4_2023-07-05.md'


2025-11-14 17:04:10,159 - INFO - Finished converting document 4_2023-07-21 in 0.25 sec.
2025-11-14 17:04:10,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:10,324 - INFO - Going to convert document batch...
2025-11-14 17:04:10,326 - INFO - Processing document 4_2023-08-04
2025-11-14 17:04:10,382 - INFO - Finished converting document 4_2023-08-04 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2023-07-21' --> 'data\processed_data\MCD\4_2023-07-21.md'
Converted 'data\edgar_documents\MCD\4_2023-08-04' --> 'data\processed_data\MCD\4_2023-08-04.md'


2025-11-14 17:04:10,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:11,092 - INFO - Going to convert document batch...
2025-11-14 17:04:11,094 - INFO - Processing document 4_2023-08-10
2025-11-14 17:04:11,189 - INFO - Finished converting document 4_2023-08-10 in 0.73 sec.
2025-11-14 17:04:11,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:11,405 - INFO - Going to convert document batch...
2025-11-14 17:04:11,407 - INFO - Processing document 4_2023-08-25


Converted 'data\edgar_documents\MCD\4_2023-08-10' --> 'data\processed_data\MCD\4_2023-08-10.md'


2025-11-14 17:04:11,549 - INFO - Finished converting document 4_2023-08-25 in 0.25 sec.
2025-11-14 17:04:11,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:11,798 - INFO - Going to convert document batch...
2025-11-14 17:04:11,800 - INFO - Processing document 4_2023-09-01
2025-11-14 17:04:11,890 - INFO - Finished converting document 4_2023-09-01 in 0.20 sec.


Converted 'data\edgar_documents\MCD\4_2023-08-25' --> 'data\processed_data\MCD\4_2023-08-25.md'


2025-11-14 17:04:11,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:12,022 - INFO - Going to convert document batch...
2025-11-14 17:04:12,024 - INFO - Processing document 4_2023-09-20
2025-11-14 17:04:12,097 - INFO - Finished converting document 4_2023-09-20 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2023-09-01' --> 'data\processed_data\MCD\4_2023-09-01.md'


2025-11-14 17:04:12,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:12,246 - INFO - Going to convert document batch...
2025-11-14 17:04:12,248 - INFO - Processing document 4_2023-09-22
2025-11-14 17:04:12,343 - INFO - Finished converting document 4_2023-09-22 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2023-09-20' --> 'data\processed_data\MCD\4_2023-09-20.md'


2025-11-14 17:04:12,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:12,494 - INFO - Going to convert document batch...
2025-11-14 17:04:12,496 - INFO - Processing document 4_2023-10-03
2025-11-14 17:04:12,582 - INFO - Finished converting document 4_2023-10-03 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2023-09-22' --> 'data\processed_data\MCD\4_2023-09-22.md'


2025-11-14 17:04:12,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:12,748 - INFO - Going to convert document batch...
2025-11-14 17:04:12,750 - INFO - Processing document 4_2023-10-24
2025-11-14 17:04:12,829 - INFO - Finished converting document 4_2023-10-24 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2023-10-03' --> 'data\processed_data\MCD\4_2023-10-03.md'


2025-11-14 17:04:12,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:12,993 - INFO - Going to convert document batch...
2025-11-14 17:04:12,996 - INFO - Processing document 4_2023-11-03


Converted 'data\edgar_documents\MCD\4_2023-10-24' --> 'data\processed_data\MCD\4_2023-10-24.md'


2025-11-14 17:04:13,155 - INFO - Finished converting document 4_2023-11-03 in 0.25 sec.
2025-11-14 17:04:13,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:13,342 - INFO - Going to convert document batch...
2025-11-14 17:04:13,344 - INFO - Processing document 4_2023-11-22
2025-11-14 17:04:13,426 - INFO - Finished converting document 4_2023-11-22 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2023-11-03' --> 'data\processed_data\MCD\4_2023-11-03.md'


2025-11-14 17:04:13,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:13,669 - INFO - Going to convert document batch...
2025-11-14 17:04:13,671 - INFO - Processing document 4_2023-12-01


Converted 'data\edgar_documents\MCD\4_2023-11-22' --> 'data\processed_data\MCD\4_2023-11-22.md'


2025-11-14 17:04:13,735 - INFO - Finished converting document 4_2023-12-01 in 0.20 sec.
2025-11-14 17:04:13,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:13,898 - INFO - Going to convert document batch...
2025-11-14 17:04:13,902 - INFO - Processing document 4_2023-12-22
2025-11-14 17:04:13,983 - INFO - Finished converting document 4_2023-12-22 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2023-12-01' --> 'data\processed_data\MCD\4_2023-12-01.md'


2025-11-14 17:04:14,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:14,162 - INFO - Going to convert document batch...
2025-11-14 17:04:14,166 - INFO - Processing document 4_2024-01-03
2025-11-14 17:04:14,277 - INFO - Finished converting document 4_2024-01-03 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2023-12-22' --> 'data\processed_data\MCD\4_2023-12-22.md'


2025-11-14 17:04:14,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:14,425 - INFO - Going to convert document batch...
2025-11-14 17:04:14,428 - INFO - Processing document 4_2024-02-09
2025-11-14 17:04:14,532 - INFO - Finished converting document 4_2024-02-09 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2024-01-03' --> 'data\processed_data\MCD\4_2024-01-03.md'


2025-11-14 17:04:14,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:14,704 - INFO - Going to convert document batch...
2025-11-14 17:04:14,706 - INFO - Processing document 4_2024-02-14
2025-11-14 17:04:14,792 - INFO - Finished converting document 4_2024-02-14 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2024-02-09' --> 'data\processed_data\MCD\4_2024-02-09.md'


2025-11-14 17:04:14,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:15,004 - INFO - Going to convert document batch...
2025-11-14 17:04:15,007 - INFO - Processing document 4_2024-02-16
2025-11-14 17:04:15,104 - INFO - Finished converting document 4_2024-02-16 in 0.20 sec.


Converted 'data\edgar_documents\MCD\4_2024-02-14' --> 'data\processed_data\MCD\4_2024-02-14.md'


2025-11-14 17:04:15,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:15,270 - INFO - Going to convert document batch...
2025-11-14 17:04:15,272 - INFO - Processing document 4_2024-02-21
2025-11-14 17:04:15,385 - INFO - Finished converting document 4_2024-02-21 in 0.20 sec.


Converted 'data\edgar_documents\MCD\4_2024-02-16' --> 'data\processed_data\MCD\4_2024-02-16.md'


2025-11-14 17:04:15,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:15,542 - INFO - Going to convert document batch...
2025-11-14 17:04:15,545 - INFO - Processing document 4_2024-02-27
2025-11-14 17:04:15,621 - INFO - Finished converting document 4_2024-02-27 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2024-02-21' --> 'data\processed_data\MCD\4_2024-02-21.md'


2025-11-14 17:04:15,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:15,792 - INFO - Going to convert document batch...
2025-11-14 17:04:15,794 - INFO - Processing document 4_2024-03-22
2025-11-14 17:04:15,872 - INFO - Finished converting document 4_2024-03-22 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2024-02-27' --> 'data\processed_data\MCD\4_2024-02-27.md'


2025-11-14 17:04:15,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:16,020 - INFO - Going to convert document batch...
2025-11-14 17:04:16,023 - INFO - Processing document 4_2024-04-02
2025-11-14 17:04:16,114 - INFO - Finished converting document 4_2024-04-02 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2024-03-22' --> 'data\processed_data\MCD\4_2024-03-22.md'


2025-11-14 17:04:16,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:16,387 - INFO - Going to convert document batch...
2025-11-14 17:04:16,389 - INFO - Processing document 4_2024-04-23
2025-11-14 17:04:16,457 - INFO - Finished converting document 4_2024-04-23 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2024-04-02' --> 'data\processed_data\MCD\4_2024-04-02.md'


2025-11-14 17:04:16,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:16,592 - INFO - Going to convert document batch...
2025-11-14 17:04:16,594 - INFO - Processing document 4_2024-05-13
2025-11-14 17:04:16,658 - INFO - Finished converting document 4_2024-05-13 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2024-04-23' --> 'data\processed_data\MCD\4_2024-04-23.md'
Converted 'data\edgar_documents\MCD\4_2024-05-13' --> 'data\processed_data\MCD\4_2024-05-13.md'


2025-11-14 17:04:16,788 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:04:16,791 - ERROR - Input document 4_2024-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:04:16,795 - INFO - Going to convert document batch...
2025-11-14 17:04:16,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:16,896 - INFO - Going to convert document batch...
2025-11-14 17:04:16,899 - INFO - Processing document 4_2024-05-21


Error processing data\edgar_documents\MCD\4_2024-05-15: File format not allowed: data\edgar_documents\MCD\4_2024-05-15


2025-11-14 17:04:17,135 - INFO - Finished converting document 4_2024-05-21 in 0.33 sec.
2025-11-14 17:04:17,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:17,289 - INFO - Going to convert document batch...
2025-11-14 17:04:17,292 - INFO - Processing document 4_2024-05-24
2025-11-14 17:04:17,359 - INFO - Finished converting document 4_2024-05-24 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2024-05-21' --> 'data\processed_data\MCD\4_2024-05-21.md'
Converted 'data\edgar_documents\MCD\4_2024-05-24' --> 'data\processed_data\MCD\4_2024-05-24.md'


2025-11-14 17:04:17,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:17,489 - INFO - Going to convert document batch...
2025-11-14 17:04:17,492 - INFO - Processing document 4_2024-05-30
2025-11-14 17:04:17,592 - INFO - Finished converting document 4_2024-05-30 in 0.17 sec.
2025-11-14 17:04:17,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:17,733 - INFO - Going to convert document batch...
2025-11-14 17:04:17,736 - INFO - Processing document 4_2024-06-21
2025-11-14 17:04:17,804 - INFO - Finished converting document 4_2024-06-21 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2024-05-30' --> 'data\processed_data\MCD\4_2024-05-30.md'
Converted 'data\edgar_documents\MCD\4_2024-06-21' --> 'data\processed_data\MCD\4_2024-06-21.md'


2025-11-14 17:04:17,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:17,935 - INFO - Going to convert document batch...
2025-11-14 17:04:17,937 - INFO - Processing document 4_2024-07-01
2025-11-14 17:04:18,091 - INFO - Finished converting document 4_2024-07-01 in 0.22 sec.
2025-11-14 17:04:18,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:18,319 - INFO - Going to convert document batch...
2025-11-14 17:04:18,321 - INFO - Processing document 4_2024-07-03
2025-11-14 17:04:18,430 - INFO - Finished converting document 4_2024-07-03 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2024-07-01' --> 'data\processed_data\MCD\4_2024-07-01.md'


2025-11-14 17:04:18,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:18,568 - INFO - Going to convert document batch...
2025-11-14 17:04:18,570 - INFO - Processing document 4_2024-07-23
2025-11-14 17:04:18,654 - INFO - Finished converting document 4_2024-07-23 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2024-07-03' --> 'data\processed_data\MCD\4_2024-07-03.md'


2025-11-14 17:04:18,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:18,797 - INFO - Going to convert document batch...
2025-11-14 17:04:18,799 - INFO - Processing document 4_2024-08-23
2025-11-14 17:04:18,857 - INFO - Finished converting document 4_2024-08-23 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2024-07-23' --> 'data\processed_data\MCD\4_2024-07-23.md'


2025-11-14 17:04:19,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:19,118 - INFO - Going to convert document batch...
2025-11-14 17:04:19,121 - INFO - Processing document 4_2024-09-03
2025-11-14 17:04:19,204 - INFO - Finished converting document 4_2024-09-03 in 0.20 sec.


Converted 'data\edgar_documents\MCD\4_2024-08-23' --> 'data\processed_data\MCD\4_2024-08-23.md'


2025-11-14 17:04:19,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:19,364 - INFO - Going to convert document batch...
2025-11-14 17:04:19,366 - INFO - Processing document 4_2024-09-18
2025-11-14 17:04:19,457 - INFO - Finished converting document 4_2024-09-18 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2024-09-03' --> 'data\processed_data\MCD\4_2024-09-03.md'


2025-11-14 17:04:19,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:19,703 - INFO - Going to convert document batch...
2025-11-14 17:04:19,706 - INFO - Processing document 4_2024-09-24


Converted 'data\edgar_documents\MCD\4_2024-09-18' --> 'data\processed_data\MCD\4_2024-09-18.md'


2025-11-14 17:04:19,813 - INFO - Finished converting document 4_2024-09-24 in 0.28 sec.
2025-11-14 17:04:19,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:19,987 - INFO - Going to convert document batch...
2025-11-14 17:04:19,989 - INFO - Processing document 4_2024-09-25


Converted 'data\edgar_documents\MCD\4_2024-09-24' --> 'data\processed_data\MCD\4_2024-09-24.md'


2025-11-14 17:04:20,169 - INFO - Finished converting document 4_2024-09-25 in 0.28 sec.
2025-11-14 17:04:20,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:20,344 - INFO - Going to convert document batch...
2025-11-14 17:04:20,346 - INFO - Processing document 4_2024-09-27
2025-11-14 17:04:20,434 - INFO - Finished converting document 4_2024-09-27 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2024-09-25' --> 'data\processed_data\MCD\4_2024-09-25.md'


2025-11-14 17:04:20,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:20,661 - INFO - Going to convert document batch...
2025-11-14 17:04:20,663 - INFO - Processing document 4_2024-10-01


Converted 'data\edgar_documents\MCD\4_2024-09-27' --> 'data\processed_data\MCD\4_2024-09-27.md'


2025-11-14 17:04:20,753 - INFO - Finished converting document 4_2024-10-01 in 0.20 sec.
2025-11-14 17:04:20,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:20,947 - INFO - Going to convert document batch...
2025-11-14 17:04:20,949 - INFO - Processing document 4_2024-10-15


Converted 'data\edgar_documents\MCD\4_2024-10-01' --> 'data\processed_data\MCD\4_2024-10-01.md'


2025-11-14 17:04:21,182 - INFO - Finished converting document 4_2024-10-15 in 0.34 sec.
2025-11-14 17:04:21,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:21,333 - INFO - Going to convert document batch...
2025-11-14 17:04:21,335 - INFO - Processing document 4_2024-10-25
2025-11-14 17:04:21,410 - INFO - Finished converting document 4_2024-10-25 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2024-10-15' --> 'data\processed_data\MCD\4_2024-10-15.md'


2025-11-14 17:04:21,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:21,576 - INFO - Going to convert document batch...
2025-11-14 17:04:21,579 - INFO - Processing document 4_2024-11-05


Converted 'data\edgar_documents\MCD\4_2024-10-25' --> 'data\processed_data\MCD\4_2024-10-25.md'


2025-11-14 17:04:21,733 - INFO - Finished converting document 4_2024-11-05 in 0.26 sec.
2025-11-14 17:04:22,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:22,054 - INFO - Going to convert document batch...
2025-11-14 17:04:22,055 - INFO - Processing document 4_2024-11-26
2025-11-14 17:04:22,123 - INFO - Finished converting document 4_2024-11-26 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2024-11-05' --> 'data\processed_data\MCD\4_2024-11-05.md'


2025-11-14 17:04:22,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:22,270 - INFO - Going to convert document batch...
2025-11-14 17:04:22,273 - INFO - Processing document 4_2024-12-23
2025-11-14 17:04:22,346 - INFO - Finished converting document 4_2024-12-23 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2024-11-26' --> 'data\processed_data\MCD\4_2024-11-26.md'


2025-11-14 17:04:22,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:22,637 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MCD\4_2024-12-23' --> 'data\processed_data\MCD\4_2024-12-23.md'


2025-11-14 17:04:22,641 - INFO - Processing document 4_2024-12-31
2025-11-14 17:04:22,728 - INFO - Finished converting document 4_2024-12-31 in 0.30 sec.
2025-11-14 17:04:22,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:22,910 - INFO - Going to convert document batch...
2025-11-14 17:04:22,911 - INFO - Processing document 4_2025-01-03
2025-11-14 17:04:22,999 - INFO - Finished converting document 4_2025-01-03 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2024-12-31' --> 'data\processed_data\MCD\4_2024-12-31.md'


2025-11-14 17:04:23,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:23,173 - INFO - Going to convert document batch...
2025-11-14 17:04:23,177 - INFO - Processing document 4_2025-01-24
2025-11-14 17:04:23,289 - INFO - Finished converting document 4_2025-01-24 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-01-03' --> 'data\processed_data\MCD\4_2025-01-03.md'


2025-11-14 17:04:23,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:23,476 - INFO - Going to convert document batch...
2025-11-14 17:04:23,479 - INFO - Processing document 4_2025-02-13


Converted 'data\edgar_documents\MCD\4_2025-01-24' --> 'data\processed_data\MCD\4_2025-01-24.md'


2025-11-14 17:04:23,596 - INFO - Finished converting document 4_2025-02-13 in 0.22 sec.
2025-11-14 17:04:23,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:23,888 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MCD\4_2025-02-13' --> 'data\processed_data\MCD\4_2025-02-13.md'


2025-11-14 17:04:23,890 - INFO - Processing document 4_2025-02-14
2025-11-14 17:04:24,011 - INFO - Finished converting document 4_2025-02-14 in 0.31 sec.
2025-11-14 17:04:24,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:24,151 - INFO - Going to convert document batch...
2025-11-14 17:04:24,153 - INFO - Processing document 4_2025-02-19
2025-11-14 17:04:24,238 - INFO - Finished converting document 4_2025-02-19 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2025-02-14' --> 'data\processed_data\MCD\4_2025-02-14.md'


2025-11-14 17:04:24,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:24,385 - INFO - Going to convert document batch...
2025-11-14 17:04:24,388 - INFO - Processing document 4_2025-02-21
2025-11-14 17:04:24,499 - INFO - Finished converting document 4_2025-02-21 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-02-19' --> 'data\processed_data\MCD\4_2025-02-19.md'


2025-11-14 17:04:24,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:24,668 - INFO - Going to convert document batch...
2025-11-14 17:04:24,670 - INFO - Processing document 4_2025-02-25
2025-11-14 17:04:24,768 - INFO - Finished converting document 4_2025-02-25 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-02-21' --> 'data\processed_data\MCD\4_2025-02-21.md'


2025-11-14 17:04:24,973 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:04:24,975 - ERROR - Input document 4_2025-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:04:24,978 - INFO - Going to convert document batch...
2025-11-14 17:04:25,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:25,052 - INFO - Going to convert document batch...
2025-11-14 17:04:25,055 - INFO - Processing document 4_2025-02-28
2025-11-14 17:04:25,133 - INFO - Fin

Converted 'data\edgar_documents\MCD\4_2025-02-25' --> 'data\processed_data\MCD\4_2025-02-25.md'
Error processing data\edgar_documents\MCD\4_2025-02-27: File format not allowed: data\edgar_documents\MCD\4_2025-02-27


2025-11-14 17:04:25,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:25,280 - INFO - Going to convert document batch...
2025-11-14 17:04:25,283 - INFO - Processing document 4_2025-03-24
2025-11-14 17:04:25,377 - INFO - Finished converting document 4_2025-03-24 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2025-02-28' --> 'data\processed_data\MCD\4_2025-02-28.md'


2025-11-14 17:04:25,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:25,536 - INFO - Going to convert document batch...
2025-11-14 17:04:25,538 - INFO - Processing document 4_2025-04-02
2025-11-14 17:04:25,631 - INFO - Finished converting document 4_2025-04-02 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-03-24' --> 'data\processed_data\MCD\4_2025-03-24.md'


2025-11-14 17:04:25,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:25,876 - INFO - Going to convert document batch...
2025-11-14 17:04:25,879 - INFO - Processing document 4_2025-04-23
2025-11-14 17:04:25,935 - INFO - Finished converting document 4_2025-04-23 in 0.14 sec.


Converted 'data\edgar_documents\MCD\4_2025-04-02' --> 'data\processed_data\MCD\4_2025-04-02.md'
Converted 'data\edgar_documents\MCD\4_2025-04-23' --> 'data\processed_data\MCD\4_2025-04-23.md'


2025-11-14 17:04:26,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:26,086 - INFO - Going to convert document batch...
2025-11-14 17:04:26,088 - INFO - Processing document 4_2025-05-09
2025-11-14 17:04:26,571 - INFO - Finished converting document 4_2025-05-09 in 0.56 sec.
2025-11-14 17:04:26,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:26,750 - INFO - Going to convert document batch...
2025-11-14 17:04:26,752 - INFO - Processing document 4_2025-05-22
2025-11-14 17:04:26,830 - INFO - Finished converting document 4_2025-05-22 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-05-09' --> 'data\processed_data\MCD\4_2025-05-09.md'
Converted 'data\edgar_documents\MCD\4_2025-05-22' --> 'data\processed_data\MCD\4_2025-05-22.md'


2025-11-14 17:04:27,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:27,211 - INFO - Going to convert document batch...
2025-11-14 17:04:27,213 - INFO - Processing document 4_2025-05-23
2025-11-14 17:04:27,280 - INFO - Finished converting document 4_2025-05-23 in 0.36 sec.
2025-11-14 17:04:27,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:27,402 - INFO - Going to convert document batch...
2025-11-14 17:04:27,405 - INFO - Processing document 4_2025-06-23
2025-11-14 17:04:27,466 - INFO - Finished converting document 4_2025-06-23 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2025-05-23' --> 'data\processed_data\MCD\4_2025-05-23.md'
Converted 'data\edgar_documents\MCD\4_2025-06-23' --> 'data\processed_data\MCD\4_2025-06-23.md'


2025-11-14 17:04:27,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:27,594 - INFO - Going to convert document batch...
2025-11-14 17:04:27,596 - INFO - Processing document 4_2025-07-01
2025-11-14 17:04:27,688 - INFO - Finished converting document 4_2025-07-01 in 0.16 sec.
2025-11-14 17:04:27,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:27,967 - INFO - Going to convert document batch...
2025-11-14 17:04:27,968 - INFO - Processing document 4_2025-07-10
2025-11-14 17:04:28,036 - INFO - Finished converting document 4_2025-07-10 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2025-07-01' --> 'data\processed_data\MCD\4_2025-07-01.md'


2025-11-14 17:04:28,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:28,192 - INFO - Going to convert document batch...
2025-11-14 17:04:28,194 - INFO - Processing document 4_2025-07-23
2025-11-14 17:04:28,263 - INFO - Finished converting document 4_2025-07-23 in 0.16 sec.


Converted 'data\edgar_documents\MCD\4_2025-07-10' --> 'data\processed_data\MCD\4_2025-07-10.md'


2025-11-14 17:04:28,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:28,465 - INFO - Going to convert document batch...
2025-11-14 17:04:28,482 - INFO - Processing document 4_2025-08-04


Converted 'data\edgar_documents\MCD\4_2025-07-23' --> 'data\processed_data\MCD\4_2025-07-23.md'


2025-11-14 17:04:28,599 - INFO - Finished converting document 4_2025-08-04 in 0.27 sec.
2025-11-14 17:04:28,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:28,722 - INFO - Going to convert document batch...
2025-11-14 17:04:28,725 - INFO - Processing document 4_2025-08-06
2025-11-14 17:04:28,793 - INFO - Finished converting document 4_2025-08-06 in 0.12 sec.


Converted 'data\edgar_documents\MCD\4_2025-08-04' --> 'data\processed_data\MCD\4_2025-08-04.md'


2025-11-14 17:04:28,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:28,971 - INFO - Going to convert document batch...
2025-11-14 17:04:28,972 - INFO - Processing document 4_2025-08-12
2025-11-14 17:04:29,068 - INFO - Finished converting document 4_2025-08-12 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2025-08-06' --> 'data\processed_data\MCD\4_2025-08-06.md'


2025-11-14 17:04:29,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:29,383 - INFO - Going to convert document batch...
2025-11-14 17:04:29,386 - INFO - Processing document 4_2025-08-13


Converted 'data\edgar_documents\MCD\4_2025-08-12' --> 'data\processed_data\MCD\4_2025-08-12.md'


2025-11-14 17:04:29,493 - INFO - Finished converting document 4_2025-08-13 in 0.20 sec.
2025-11-14 17:04:29,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:29,780 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MCD\4_2025-08-13' --> 'data\processed_data\MCD\4_2025-08-13.md'


2025-11-14 17:04:29,782 - INFO - Processing document 4_2025-08-19
2025-11-14 17:04:29,847 - INFO - Finished converting document 4_2025-08-19 in 0.25 sec.
2025-11-14 17:04:29,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:30,000 - INFO - Going to convert document batch...
2025-11-14 17:04:30,003 - INFO - Processing document 4_2025-08-20
2025-11-14 17:04:30,104 - INFO - Finished converting document 4_2025-08-20 in 0.19 sec.


Converted 'data\edgar_documents\MCD\4_2025-08-19' --> 'data\processed_data\MCD\4_2025-08-19.md'


2025-11-14 17:04:30,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:30,271 - INFO - Going to convert document batch...
2025-11-14 17:04:30,274 - INFO - Processing document 4_2025-09-02


Converted 'data\edgar_documents\MCD\4_2025-08-20' --> 'data\processed_data\MCD\4_2025-08-20.md'


2025-11-14 17:04:30,424 - INFO - Finished converting document 4_2025-09-02 in 0.23 sec.
2025-11-14 17:04:30,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:30,601 - INFO - Going to convert document batch...
2025-11-14 17:04:30,602 - INFO - Processing document 4_2025-10-01


Converted 'data\edgar_documents\MCD\4_2025-09-02' --> 'data\processed_data\MCD\4_2025-09-02.md'


2025-11-14 17:04:30,709 - INFO - Finished converting document 4_2025-10-01 in 0.19 sec.
2025-11-14 17:04:30,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:30,914 - INFO - Going to convert document batch...
2025-11-14 17:04:30,917 - INFO - Processing document 4_2025-10-16


Converted 'data\edgar_documents\MCD\4_2025-10-01' --> 'data\processed_data\MCD\4_2025-10-01.md'


2025-11-14 17:04:31,117 - INFO - Finished converting document 4_2025-10-16 in 0.31 sec.
2025-11-14 17:04:31,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:31,318 - INFO - Going to convert document batch...
2025-11-14 17:04:31,322 - INFO - Processing document 4_2025-11-07


Converted 'data\edgar_documents\MCD\4_2025-10-16' --> 'data\processed_data\MCD\4_2025-10-16.md'


2025-11-14 17:04:31,429 - INFO - Finished converting document 4_2025-11-07 in 0.22 sec.
2025-11-14 17:04:31,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:31,625 - INFO - Going to convert document batch...
2025-11-14 17:04:31,627 - INFO - Processing document 8-K_2023-01-06
2025-11-14 17:04:31,694 - INFO - Finished converting document 8-K_2023-01-06 in 0.17 sec.


Converted 'data\edgar_documents\MCD\4_2025-11-07' --> 'data\processed_data\MCD\4_2025-11-07.md'


2025-11-14 17:04:31,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:31,915 - INFO - Going to convert document batch...
2025-11-14 17:04:31,918 - INFO - Processing document 8-K_2023-01-19


Converted 'data\edgar_documents\MCD\8-K_2023-01-06' --> 'data\processed_data\MCD\8-K_2023-01-06.md'


2025-11-14 17:04:32,013 - INFO - Finished converting document 8-K_2023-01-19 in 0.20 sec.
2025-11-14 17:04:32,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:32,171 - INFO - Going to convert document batch...
2025-11-14 17:04:32,174 - INFO - Processing document 8-K_2023-01-31
2025-11-14 17:04:32,235 - INFO - Finished converting document 8-K_2023-01-31 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2023-01-19' --> 'data\processed_data\MCD\8-K_2023-01-19.md'


2025-11-14 17:04:32,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\8-K_2023-01-31' --> 'data\processed_data\MCD\8-K_2023-01-31.md'


2025-11-14 17:04:32,478 - INFO - Going to convert document batch...
2025-11-14 17:04:32,483 - INFO - Processing document 8-K_2023-02-15
2025-11-14 17:04:32,593 - INFO - Finished converting document 8-K_2023-02-15 in 0.31 sec.
2025-11-14 17:04:32,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:32,740 - INFO - Going to convert document batch...
2025-11-14 17:04:32,742 - INFO - Processing document 8-K_2023-03-29
2025-11-14 17:04:32,825 - INFO - Finished converting document 8-K_2023-03-29 in 0.19 sec.


Converted 'data\edgar_documents\MCD\8-K_2023-02-15' --> 'data\processed_data\MCD\8-K_2023-02-15.md'


2025-11-14 17:04:32,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:32,997 - INFO - Going to convert document batch...
2025-11-14 17:04:33,000 - INFO - Processing document 8-K_2023-04-25


Converted 'data\edgar_documents\MCD\8-K_2023-03-29' --> 'data\processed_data\MCD\8-K_2023-03-29.md'


2025-11-14 17:04:33,093 - INFO - Finished converting document 8-K_2023-04-25 in 0.22 sec.
2025-11-14 17:04:33,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:33,300 - INFO - Going to convert document batch...
2025-11-14 17:04:33,303 - INFO - Processing document 8-K_2023-06-01


Converted 'data\edgar_documents\MCD\8-K_2023-04-25' --> 'data\processed_data\MCD\8-K_2023-04-25.md'


2025-11-14 17:04:33,503 - INFO - Finished converting document 8-K_2023-06-01 in 0.36 sec.
2025-11-14 17:04:33,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:33,726 - INFO - Going to convert document batch...
2025-11-14 17:04:33,729 - INFO - Processing document 8-K_2023-07-27
2025-11-14 17:04:33,808 - INFO - Finished converting document 8-K_2023-07-27 in 0.20 sec.


Converted 'data\edgar_documents\MCD\8-K_2023-06-01' --> 'data\processed_data\MCD\8-K_2023-06-01.md'


2025-11-14 17:04:33,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:33,959 - INFO - Going to convert document batch...
2025-11-14 17:04:33,961 - INFO - Processing document 8-K_2023-08-15
2025-11-14 17:04:34,052 - INFO - Finished converting document 8-K_2023-08-15 in 0.19 sec.


Converted 'data\edgar_documents\MCD\8-K_2023-07-27' --> 'data\processed_data\MCD\8-K_2023-07-27.md'


2025-11-14 17:04:34,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:34,269 - INFO - Going to convert document batch...
2025-11-14 17:04:34,273 - INFO - Processing document 8-K_2023-08-24


Converted 'data\edgar_documents\MCD\8-K_2023-08-15' --> 'data\processed_data\MCD\8-K_2023-08-15.md'


2025-11-14 17:04:34,417 - INFO - Finished converting document 8-K_2023-08-24 in 0.30 sec.
2025-11-14 17:04:34,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:34,582 - INFO - Going to convert document batch...
2025-11-14 17:04:34,584 - INFO - Processing document 8-K_2023-10-30


Converted 'data\edgar_documents\MCD\8-K_2023-08-24' --> 'data\processed_data\MCD\8-K_2023-08-24.md'


2025-11-14 17:04:34,673 - INFO - Finished converting document 8-K_2023-10-30 in 0.20 sec.
2025-11-14 17:04:34,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:34,833 - INFO - Going to convert document batch...
2025-11-14 17:04:34,836 - INFO - Processing document 8-K_2023-12-06
2025-11-14 17:04:34,911 - INFO - Finished converting document 8-K_2023-12-06 in 0.19 sec.


Converted 'data\edgar_documents\MCD\8-K_2023-10-30' --> 'data\processed_data\MCD\8-K_2023-10-30.md'


2025-11-14 17:04:35,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:35,106 - INFO - Going to convert document batch...
2025-11-14 17:04:35,109 - INFO - Processing document 8-K_2024-02-05


Converted 'data\edgar_documents\MCD\8-K_2023-12-06' --> 'data\processed_data\MCD\8-K_2023-12-06.md'


2025-11-14 17:04:35,213 - INFO - Finished converting document 8-K_2024-02-05 in 0.25 sec.
2025-11-14 17:04:35,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:35,331 - INFO - Going to convert document batch...
2025-11-14 17:04:35,334 - INFO - Processing document 8-K_2024-02-16
2025-11-14 17:04:35,445 - INFO - Finished converting document 8-K_2024-02-16 in 0.19 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-02-05' --> 'data\processed_data\MCD\8-K_2024-02-05.md'


2025-11-14 17:04:35,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:35,623 - INFO - Going to convert document batch...
2025-11-14 17:04:35,625 - INFO - Processing document 8-K_2024-03-13
2025-11-14 17:04:35,693 - INFO - Finished converting document 8-K_2024-03-13 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-02-16' --> 'data\processed_data\MCD\8-K_2024-02-16.md'


2025-11-14 17:04:35,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:35,792 - INFO - Going to convert document batch...
2025-11-14 17:04:35,794 - INFO - Processing document 8-K_2024-03-19
2025-11-14 17:04:35,868 - INFO - Finished converting document 8-K_2024-03-19 in 0.12 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-03-13' --> 'data\processed_data\MCD\8-K_2024-03-13.md'


2025-11-14 17:04:36,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:36,151 - INFO - Going to convert document batch...
2025-11-14 17:04:36,152 - INFO - Processing document 8-K_2024-04-30
2025-11-14 17:04:36,226 - INFO - Finished converting document 8-K_2024-04-30 in 0.16 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-03-19' --> 'data\processed_data\MCD\8-K_2024-03-19.md'


2025-11-14 17:04:36,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:36,377 - INFO - Going to convert document batch...
2025-11-14 17:04:36,379 - INFO - Processing document 8-K_2024-05-20
2025-11-14 17:04:36,469 - INFO - Finished converting document 8-K_2024-05-20 in 0.20 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-04-30' --> 'data\processed_data\MCD\8-K_2024-04-30.md'


2025-11-14 17:04:36,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\8-K_2024-05-20' --> 'data\processed_data\MCD\8-K_2024-05-20.md'


2025-11-14 17:04:36,807 - INFO - Going to convert document batch...
2025-11-14 17:04:36,809 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:04:36,980 - INFO - Finished converting document 8-K_2024-05-24 in 0.45 sec.
2025-11-14 17:04:37,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:37,132 - INFO - Going to convert document batch...
2025-11-14 17:04:37,134 - INFO - Processing document 8-K_2024-07-26
2025-11-14 17:04:37,230 - INFO - Finished converting document 8-K_2024-07-26 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-05-24' --> 'data\processed_data\MCD\8-K_2024-05-24.md'


2025-11-14 17:04:37,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\8-K_2024-07-26' --> 'data\processed_data\MCD\8-K_2024-07-26.md'


2025-11-14 17:04:37,494 - INFO - Going to convert document batch...
2025-11-14 17:04:37,498 - INFO - Processing document 8-K_2024-07-29
2025-11-14 17:04:37,596 - INFO - Finished converting document 8-K_2024-07-29 in 0.31 sec.
2025-11-14 17:04:37,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:37,734 - INFO - Going to convert document batch...
2025-11-14 17:04:37,736 - INFO - Processing document 8-K_2024-10-29
2025-11-14 17:04:37,806 - INFO - Finished converting document 8-K_2024-10-29 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-07-29' --> 'data\processed_data\MCD\8-K_2024-07-29.md'


2025-11-14 17:04:37,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:37,933 - INFO - Going to convert document batch...
2025-11-14 17:04:37,935 - INFO - Processing document 8-K_2025-01-17
2025-11-14 17:04:38,013 - INFO - Finished converting document 8-K_2025-01-17 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2024-10-29' --> 'data\processed_data\MCD\8-K_2024-10-29.md'


2025-11-14 17:04:38,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:38,113 - INFO - Going to convert document batch...
2025-11-14 17:04:38,115 - INFO - Processing document 8-K_2025-02-10


Converted 'data\edgar_documents\MCD\8-K_2025-01-17' --> 'data\processed_data\MCD\8-K_2025-01-17.md'


2025-11-14 17:04:38,245 - INFO - Finished converting document 8-K_2025-02-10 in 0.20 sec.
2025-11-14 17:04:38,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:38,426 - INFO - Going to convert document batch...
2025-11-14 17:04:38,427 - INFO - Processing document 8-K_2025-02-14
2025-11-14 17:04:38,507 - INFO - Finished converting document 8-K_2025-02-14 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2025-02-10' --> 'data\processed_data\MCD\8-K_2025-02-10.md'


2025-11-14 17:04:38,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:38,650 - INFO - Going to convert document batch...
2025-11-14 17:04:38,652 - INFO - Processing document 8-K_2025-03-04
2025-11-14 17:04:38,728 - INFO - Finished converting document 8-K_2025-03-04 in 0.17 sec.


Converted 'data\edgar_documents\MCD\8-K_2025-02-14' --> 'data\processed_data\MCD\8-K_2025-02-14.md'


2025-11-14 17:04:38,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:38,895 - INFO - Going to convert document batch...
2025-11-14 17:04:38,898 - INFO - Processing document 8-K_2025-03-11


Converted 'data\edgar_documents\MCD\8-K_2025-03-04' --> 'data\processed_data\MCD\8-K_2025-03-04.md'


2025-11-14 17:04:39,066 - INFO - Finished converting document 8-K_2025-03-11 in 0.23 sec.
2025-11-14 17:04:39,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:39,245 - INFO - Going to convert document batch...
2025-11-14 17:04:39,247 - INFO - Processing document 8-K_2025-05-01
2025-11-14 17:04:39,320 - INFO - Finished converting document 8-K_2025-05-01 in 0.14 sec.


Converted 'data\edgar_documents\MCD\8-K_2025-03-11' --> 'data\processed_data\MCD\8-K_2025-03-11.md'
Converted 'data\edgar_documents\MCD\8-K_2025-05-01' --> 'data\processed_data\MCD\8-K_2025-05-01.md'


2025-11-14 17:04:39,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:39,474 - INFO - Going to convert document batch...
2025-11-14 17:04:39,476 - INFO - Processing document 8-K_2025-05-23
2025-11-14 17:04:39,631 - INFO - Finished converting document 8-K_2025-05-23 in 0.27 sec.
2025-11-14 17:04:39,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:39,813 - INFO - Going to convert document batch...
2025-11-14 17:04:39,815 - INFO - Processing document 8-K_2025-08-06
2025-11-14 17:04:39,901 - INFO - Finished converting document 8-K_2025-08-06 in 0.20 sec.


Converted 'data\edgar_documents\MCD\8-K_2025-05-23' --> 'data\processed_data\MCD\8-K_2025-05-23.md'


2025-11-14 17:04:40,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:40,055 - INFO - Going to convert document batch...
2025-11-14 17:04:40,057 - INFO - Processing document 8-K_2025-08-27


Converted 'data\edgar_documents\MCD\8-K_2025-08-06' --> 'data\processed_data\MCD\8-K_2025-08-06.md'


2025-11-14 17:04:40,157 - INFO - Finished converting document 8-K_2025-08-27 in 0.20 sec.
2025-11-14 17:04:40,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:40,389 - INFO - Going to convert document batch...
2025-11-14 17:04:40,400 - INFO - Processing document 8-K_2025-11-05


Converted 'data\edgar_documents\MCD\8-K_2025-08-27' --> 'data\processed_data\MCD\8-K_2025-08-27.md'


2025-11-14 17:04:40,565 - INFO - Finished converting document 8-K_2025-11-05 in 0.34 sec.


Converted 'data\edgar_documents\MCD\8-K_2025-11-05' --> 'data\processed_data\MCD\8-K_2025-11-05.md'


2025-11-14 17:04:40,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:04:44,781 - INFO - Going to convert document batch...
2025-11-14 17:04:44,783 - INFO - Processing document DEF-14A_2023-04-14
2025-11-14 17:05:15,821 - INFO - Finished converting document DEF-14A_2023-04-14 in 35.22 sec.
2025-11-14 17:05:20,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\DEF-14A_2023-04-14' --> 'data\processed_data\MCD\DEF-14A_2023-04-14.md'


2025-11-14 17:05:23,409 - INFO - Going to convert document batch...
2025-11-14 17:05:23,411 - INFO - Processing document DEF-14A_2024-04-08
2025-11-14 17:05:49,988 - INFO - Finished converting document DEF-14A_2024-04-08 in 30.03 sec.
2025-11-14 17:05:54,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MCD\DEF-14A_2024-04-08' --> 'data\processed_data\MCD\DEF-14A_2024-04-08.md'


2025-11-14 17:05:57,116 - INFO - Going to convert document batch...
2025-11-14 17:05:57,118 - INFO - Processing document DEF-14A_2025-04-07
2025-11-14 17:06:24,890 - INFO - Finished converting document DEF-14A_2025-04-07 in 30.98 sec.


Converted 'data\edgar_documents\MCD\DEF-14A_2025-04-07' --> 'data\processed_data\MCD\DEF-14A_2025-04-07.md'
Processed 133 new files. Errors: 2
Found 83 files to process in data\edgar_documents\MDLZ


2025-11-14 17:06:28,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:06:33,577 - INFO - Going to convert document batch...
2025-11-14 17:06:33,579 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:06:33,583 - INFO - Processing document 10-K_2023-02-03
2025-11-14 17:06:50,894 - INFO - Finished converting document 10-K_2023-02-03 in 22.23 sec.


Converted 'data\edgar_documents\MDLZ\10-K_2023-02-03' --> 'data\processed_data\MDLZ\10-K_2023-02-03.md'


2025-11-14 17:06:55,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:06:59,610 - INFO - Going to convert document batch...
2025-11-14 17:06:59,612 - INFO - Processing document 10-K_2024-02-02
2025-11-14 17:07:18,418 - INFO - Finished converting document 10-K_2024-02-02 in 23.45 sec.
2025-11-14 17:07:22,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-K_2024-02-02' --> 'data\processed_data\MDLZ\10-K_2024-02-02.md'


2025-11-14 17:07:27,736 - INFO - Going to convert document batch...
2025-11-14 17:07:27,738 - INFO - Processing document 10-K_2025-02-05
2025-11-14 17:07:46,230 - INFO - Finished converting document 10-K_2025-02-05 in 23.51 sec.
2025-11-14 17:07:50,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-K_2025-02-05' --> 'data\processed_data\MDLZ\10-K_2025-02-05.md'


2025-11-14 17:07:53,828 - INFO - Going to convert document batch...
2025-11-14 17:07:53,831 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:07:58,606 - INFO - Finished converting document 10-Q_2023-04-27 in 7.98 sec.
2025-11-14 17:08:00,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2023-04-27' --> 'data\processed_data\MDLZ\10-Q_2023-04-27.md'


2025-11-14 17:08:03,269 - INFO - Going to convert document batch...
2025-11-14 17:08:03,271 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:08:08,901 - INFO - Finished converting document 10-Q_2023-07-27 in 8.20 sec.
2025-11-14 17:08:12,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2023-07-27' --> 'data\processed_data\MDLZ\10-Q_2023-07-27.md'


2025-11-14 17:08:14,898 - INFO - Going to convert document batch...
2025-11-14 17:08:14,900 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 17:08:20,582 - INFO - Finished converting document 10-Q_2023-11-01 in 8.28 sec.
2025-11-14 17:08:23,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2023-11-01' --> 'data\processed_data\MDLZ\10-Q_2023-11-01.md'


2025-11-14 17:08:25,538 - INFO - Going to convert document batch...
2025-11-14 17:08:25,540 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 17:08:30,235 - INFO - Finished converting document 10-Q_2024-04-30 in 6.58 sec.
2025-11-14 17:08:32,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2024-04-30' --> 'data\processed_data\MDLZ\10-Q_2024-04-30.md'


2025-11-14 17:08:35,465 - INFO - Going to convert document batch...
2025-11-14 17:08:35,466 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 17:08:41,530 - INFO - Finished converting document 10-Q_2024-07-30 in 9.38 sec.
2025-11-14 17:08:44,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2024-07-30' --> 'data\processed_data\MDLZ\10-Q_2024-07-30.md'


2025-11-14 17:08:47,232 - INFO - Going to convert document batch...
2025-11-14 17:08:47,234 - INFO - Processing document 10-Q_2024-10-29
2025-11-14 17:08:53,573 - INFO - Finished converting document 10-Q_2024-10-29 in 9.52 sec.
2025-11-14 17:08:56,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2024-10-29' --> 'data\processed_data\MDLZ\10-Q_2024-10-29.md'


2025-11-14 17:08:58,090 - INFO - Going to convert document batch...
2025-11-14 17:08:58,092 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:09:03,120 - INFO - Finished converting document 10-Q_2025-04-29 in 7.03 sec.
2025-11-14 17:09:05,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2025-04-29' --> 'data\processed_data\MDLZ\10-Q_2025-04-29.md'


2025-11-14 17:09:07,653 - INFO - Going to convert document batch...
2025-11-14 17:09:07,655 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 17:09:13,069 - INFO - Finished converting document 10-Q_2025-07-29 in 7.84 sec.
2025-11-14 17:09:15,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\10-Q_2025-07-29' --> 'data\processed_data\MDLZ\10-Q_2025-07-29.md'


2025-11-14 17:09:18,723 - INFO - Going to convert document batch...
2025-11-14 17:09:18,727 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 17:09:24,652 - INFO - Finished converting document 10-Q_2025-10-28 in 9.11 sec.
2025-11-14 17:09:27,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:27,241 - INFO - Going to convert document batch...
2025-11-14 17:09:27,243 - INFO - Processing document 4_2023-01-05
2025-11-14 17:09:27,320 - INFO - Finished converting document 4_2023-01-05 in 0.17 sec.


Converted 'data\edgar_documents\MDLZ\10-Q_2025-10-28' --> 'data\processed_data\MDLZ\10-Q_2025-10-28.md'


2025-11-14 17:09:27,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:27,519 - INFO - Going to convert document batch...
2025-11-14 17:09:27,523 - INFO - Processing document 4_2023-02-06
2025-11-14 17:09:27,614 - INFO - Finished converting document 4_2023-02-06 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-01-05' --> 'data\processed_data\MDLZ\4_2023-01-05.md'


2025-11-14 17:09:27,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:27,804 - INFO - Going to convert document batch...
2025-11-14 17:09:27,810 - INFO - Processing document 4_2023-02-23
2025-11-14 17:09:27,903 - INFO - Finished converting document 4_2023-02-23 in 0.20 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-02-06' --> 'data\processed_data\MDLZ\4_2023-02-06.md'


2025-11-14 17:09:28,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:28,055 - INFO - Going to convert document batch...
2025-11-14 17:09:28,057 - INFO - Processing document 4_2023-03-01


Converted 'data\edgar_documents\MDLZ\4_2023-02-23' --> 'data\processed_data\MDLZ\4_2023-02-23.md'


2025-11-14 17:09:28,208 - INFO - Finished converting document 4_2023-03-01 in 0.23 sec.
2025-11-14 17:09:28,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:28,387 - INFO - Going to convert document batch...
2025-11-14 17:09:28,390 - INFO - Processing document 4_2023-03-03
2025-11-14 17:09:28,466 - INFO - Finished converting document 4_2023-03-03 in 0.14 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-03-01' --> 'data\processed_data\MDLZ\4_2023-03-01.md'


2025-11-14 17:09:28,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:28,626 - INFO - Going to convert document batch...
2025-11-14 17:09:28,628 - INFO - Processing document 4_2023-03-06
2025-11-14 17:09:28,701 - INFO - Finished converting document 4_2023-03-06 in 0.17 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-03-03' --> 'data\processed_data\MDLZ\4_2023-03-03.md'
Converted 'data\edgar_documents\MDLZ\4_2023-03-06' --> 'data\processed_data\MDLZ\4_2023-03-06.md'


2025-11-14 17:09:29,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:29,227 - INFO - Going to convert document batch...
2025-11-14 17:09:29,232 - INFO - Processing document 4_2023-05-05
2025-11-14 17:09:29,343 - INFO - Finished converting document 4_2023-05-05 in 0.47 sec.
2025-11-14 17:09:29,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:29,558 - INFO - Going to convert document batch...
2025-11-14 17:09:29,561 - INFO - Processing document 4_2023-05-18
2025-11-14 17:09:29,641 - INFO - Finished converting document 4_2023-05-18 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-05-05' --> 'data\processed_data\MDLZ\4_2023-05-05.md'


2025-11-14 17:09:29,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:29,827 - INFO - Going to convert document batch...
2025-11-14 17:09:29,829 - INFO - Processing document 4_2023-07-24
2025-11-14 17:09:29,910 - INFO - Finished converting document 4_2023-07-24 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-05-18' --> 'data\processed_data\MDLZ\4_2023-05-18.md'


2025-11-14 17:09:30,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:30,191 - INFO - Going to convert document batch...
2025-11-14 17:09:30,193 - INFO - Processing document 4_2024-02-02
2025-11-14 17:09:30,268 - INFO - Finished converting document 4_2024-02-02 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\4_2023-07-24' --> 'data\processed_data\MDLZ\4_2023-07-24.md'


2025-11-14 17:09:30,425 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:30,426 - ERROR - Input document 4_2024-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:09:30,429 - INFO - Going to convert document batch...
2025-11-14 17:09:30,481 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:30,483 - ERROR - Input document 4_2024-02-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MDLZ\4_2024-02-02' --> 'data\processed_data\MDLZ\4_2024-02-02.md'
Error processing data\edgar_documents\MDLZ\4_2024-02-15: File format not allowed: data\edgar_documents\MDLZ\4_2024-02-15
Error processing data\edgar_documents\MDLZ\4_2024-02-16: File format not allowed: data\edgar_documents\MDLZ\4_2024-02-16


2025-11-14 17:09:30,553 - INFO - Processing document 4_2024-02-29
2025-11-14 17:09:30,705 - INFO - Finished converting document 4_2024-02-29 in 0.22 sec.
2025-11-14 17:09:30,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:30,926 - INFO - Going to convert document batch...
2025-11-14 17:09:30,928 - INFO - Processing document 4_2024-04-04
2025-11-14 17:09:30,989 - INFO - Finished converting document 4_2024-04-04 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\4_2024-02-29' --> 'data\processed_data\MDLZ\4_2024-02-29.md'


2025-11-14 17:09:31,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:31,122 - INFO - Going to convert document batch...
2025-11-14 17:09:31,125 - INFO - Processing document 4_2024-05-24
2025-11-14 17:09:31,197 - INFO - Finished converting document 4_2024-05-24 in 0.14 sec.


Converted 'data\edgar_documents\MDLZ\4_2024-04-04' --> 'data\processed_data\MDLZ\4_2024-04-04.md'


2025-11-14 17:09:31,348 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:31,349 - ERROR - Input document 4_2024-06-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:09:31,354 - INFO - Going to convert document batch...
2025-11-14 17:09:31,406 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:31,408 - ERROR - Input document 4_2024-06-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MDLZ\4_2024-05-24' --> 'data\processed_data\MDLZ\4_2024-05-24.md'
Error processing data\edgar_documents\MDLZ\4_2024-06-26: File format not allowed: data\edgar_documents\MDLZ\4_2024-06-26
Error processing data\edgar_documents\MDLZ\4_2024-06-28: File format not allowed: data\edgar_documents\MDLZ\4_2024-06-28


2025-11-14 17:09:31,474 - ERROR - Input document 4_2024-08-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:09:31,478 - INFO - Going to convert document batch...
2025-11-14 17:09:31,543 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:31,545 - ERROR - Input document 4_2024-08-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\MDLZ\4_2024-08-22: File format not allowed: data\edgar_documents\MDLZ\4_2024-08-22
Error processing data\edgar_documents\MDLZ\4_2024-08-23: File format not allowed: data\edgar_documents\MDLZ\4_2024-08-23


2025-11-14 17:09:31,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:31,891 - INFO - Going to convert document batch...
2025-11-14 17:09:31,893 - INFO - Processing document 4_2025-01-03
2025-11-14 17:09:31,962 - INFO - Finished converting document 4_2025-01-03 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\4_2024-09-11' --> 'data\processed_data\MDLZ\4_2024-09-11.md'


2025-11-14 17:09:32,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:32,128 - INFO - Going to convert document batch...
2025-11-14 17:09:32,132 - INFO - Processing document 4_2025-02-14
2025-11-14 17:09:32,221 - INFO - Finished converting document 4_2025-02-14 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\4_2025-01-03' --> 'data\processed_data\MDLZ\4_2025-01-03.md'


2025-11-14 17:09:32,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:32,409 - INFO - Going to convert document batch...
2025-11-14 17:09:32,411 - INFO - Processing document 4_2025-03-06


Converted 'data\edgar_documents\MDLZ\4_2025-02-14' --> 'data\processed_data\MDLZ\4_2025-02-14.md'


2025-11-14 17:09:32,639 - INFO - Finished converting document 4_2025-03-06 in 0.34 sec.
2025-11-14 17:09:32,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:32,792 - INFO - Going to convert document batch...
2025-11-14 17:09:32,794 - INFO - Processing document 4_2025-03-13
2025-11-14 17:09:32,870 - INFO - Finished converting document 4_2025-03-13 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\4_2025-03-06' --> 'data\processed_data\MDLZ\4_2025-03-06.md'


2025-11-14 17:09:33,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\4_2025-03-13' --> 'data\processed_data\MDLZ\4_2025-03-13.md'


2025-11-14 17:09:33,897 - INFO - Going to convert document batch...
2025-11-14 17:09:33,899 - INFO - Processing document 4_2025-03-19
2025-11-14 17:09:33,981 - INFO - Finished converting document 4_2025-03-19 in 1.03 sec.
2025-11-14 17:09:34,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:34,151 - INFO - Going to convert document batch...
2025-11-14 17:09:34,154 - INFO - Processing document 4_2025-04-03
2025-11-14 17:09:34,220 - INFO - Finished converting document 4_2025-04-03 in 0.14 sec.


Converted 'data\edgar_documents\MDLZ\4_2025-03-19' --> 'data\processed_data\MDLZ\4_2025-03-19.md'


2025-11-14 17:09:34,378 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:34,380 - ERROR - Input document 4_2025-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:09:34,385 - INFO - Going to convert document batch...
2025-11-14 17:09:34,442 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:09:34,445 - ERROR - Input document 4_2025-05-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MDLZ\4_2025-04-03' --> 'data\processed_data\MDLZ\4_2025-04-03.md'
Error processing data\edgar_documents\MDLZ\4_2025-05-01: File format not allowed: data\edgar_documents\MDLZ\4_2025-05-01
Error processing data\edgar_documents\MDLZ\4_2025-05-02: File format not allowed: data\edgar_documents\MDLZ\4_2025-05-02


2025-11-14 17:09:34,515 - INFO - Going to convert document batch...
2025-11-14 17:09:34,517 - INFO - Processing document 4_2025-05-22
2025-11-14 17:09:34,607 - INFO - Finished converting document 4_2025-05-22 in 0.16 sec.
2025-11-14 17:09:34,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:34,799 - INFO - Going to convert document batch...
2025-11-14 17:09:34,801 - INFO - Processing document 4_2025-07-02
2025-11-14 17:09:34,899 - INFO - Finished converting document 4_2025-07-02 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\4_2025-05-22' --> 'data\processed_data\MDLZ\4_2025-05-22.md'


2025-11-14 17:09:35,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:35,098 - INFO - Going to convert document batch...
2025-11-14 17:09:35,102 - INFO - Processing document 8-K_2023-01-31


Converted 'data\edgar_documents\MDLZ\4_2025-07-02' --> 'data\processed_data\MDLZ\4_2025-07-02.md'


2025-11-14 17:09:35,182 - INFO - Finished converting document 8-K_2023-01-31 in 0.20 sec.
2025-11-14 17:09:35,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:35,346 - INFO - Going to convert document batch...
2025-11-14 17:09:35,348 - INFO - Processing document 8-K_2023-02-07
2025-11-14 17:09:35,429 - INFO - Finished converting document 8-K_2023-02-07 in 0.17 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2023-01-31' --> 'data\processed_data\MDLZ\8-K_2023-01-31.md'


2025-11-14 17:09:35,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:35,595 - INFO - Going to convert document batch...
2025-11-14 17:09:35,597 - INFO - Processing document 8-K_2023-02-21


Converted 'data\edgar_documents\MDLZ\8-K_2023-02-07' --> 'data\processed_data\MDLZ\8-K_2023-02-07.md'


2025-11-14 17:09:35,705 - INFO - Finished converting document 8-K_2023-02-21 in 0.22 sec.
2025-11-14 17:09:35,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:35,894 - INFO - Going to convert document batch...
2025-11-14 17:09:35,896 - INFO - Processing document 8-K_2023-02-22


Converted 'data\edgar_documents\MDLZ\8-K_2023-02-21' --> 'data\processed_data\MDLZ\8-K_2023-02-21.md'


2025-11-14 17:09:36,025 - INFO - Finished converting document 8-K_2023-02-22 in 0.25 sec.
2025-11-14 17:09:36,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\8-K_2023-02-22' --> 'data\processed_data\MDLZ\8-K_2023-02-22.md'


2025-11-14 17:09:36,309 - INFO - Going to convert document batch...
2025-11-14 17:09:36,312 - INFO - Processing document 8-K_2023-04-06
2025-11-14 17:09:36,389 - INFO - Finished converting document 8-K_2023-04-06 in 0.31 sec.
2025-11-14 17:09:36,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:36,604 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDLZ\8-K_2023-04-06' --> 'data\processed_data\MDLZ\8-K_2023-04-06.md'


2025-11-14 17:09:36,607 - INFO - Processing document 8-K_2023-04-11
2025-11-14 17:09:36,775 - INFO - Finished converting document 8-K_2023-04-11 in 0.34 sec.
2025-11-14 17:09:36,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:36,964 - INFO - Going to convert document batch...
2025-11-14 17:09:36,967 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:09:37,030 - INFO - Finished converting document 8-K_2023-04-27 in 0.17 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2023-04-11' --> 'data\processed_data\MDLZ\8-K_2023-04-11.md'


2025-11-14 17:09:37,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:37,197 - INFO - Going to convert document batch...
2025-11-14 17:09:37,199 - INFO - Processing document 8-K_2023-05-02


Converted 'data\edgar_documents\MDLZ\8-K_2023-04-27' --> 'data\processed_data\MDLZ\8-K_2023-04-27.md'


2025-11-14 17:09:37,294 - INFO - Finished converting document 8-K_2023-05-02 in 0.22 sec.
2025-11-14 17:09:37,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:37,633 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDLZ\8-K_2023-05-02' --> 'data\processed_data\MDLZ\8-K_2023-05-02.md'


2025-11-14 17:09:37,635 - INFO - Processing document 8-K_2023-05-19
2025-11-14 17:09:37,765 - INFO - Finished converting document 8-K_2023-05-19 in 0.33 sec.
2025-11-14 17:09:37,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:37,962 - INFO - Going to convert document batch...
2025-11-14 17:09:37,964 - INFO - Processing document 8-K_2023-07-20
2025-11-14 17:09:38,028 - INFO - Finished converting document 8-K_2023-07-20 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2023-05-19' --> 'data\processed_data\MDLZ\8-K_2023-05-19.md'


2025-11-14 17:09:38,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:38,211 - INFO - Going to convert document batch...
2025-11-14 17:09:38,213 - INFO - Processing document 8-K_2023-07-27


Converted 'data\edgar_documents\MDLZ\8-K_2023-07-20' --> 'data\processed_data\MDLZ\8-K_2023-07-20.md'


2025-11-14 17:09:38,291 - INFO - Finished converting document 8-K_2023-07-27 in 0.23 sec.
2025-11-14 17:09:38,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:38,532 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDLZ\8-K_2023-07-27' --> 'data\processed_data\MDLZ\8-K_2023-07-27.md'


2025-11-14 17:09:38,536 - INFO - Processing document 8-K_2023-10-10
2025-11-14 17:09:38,712 - INFO - Finished converting document 8-K_2023-10-10 in 0.36 sec.
2025-11-14 17:09:38,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:38,961 - INFO - Going to convert document batch...
2025-11-14 17:09:38,963 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:09:39,032 - INFO - Finished converting document 8-K_2023-10-18 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2023-10-10' --> 'data\processed_data\MDLZ\8-K_2023-10-10.md'


2025-11-14 17:09:39,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:39,174 - INFO - Going to convert document batch...
2025-11-14 17:09:39,178 - INFO - Processing document 8-K_2023-11-01


Converted 'data\edgar_documents\MDLZ\8-K_2023-10-18' --> 'data\processed_data\MDLZ\8-K_2023-10-18.md'


2025-11-14 17:09:39,269 - INFO - Finished converting document 8-K_2023-11-01 in 0.20 sec.
2025-11-14 17:09:39,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:39,505 - INFO - Going to convert document batch...
2025-11-14 17:09:39,507 - INFO - Processing document 8-K_2024-01-30
2025-11-14 17:09:39,559 - INFO - Finished converting document 8-K_2024-01-30 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2023-11-01' --> 'data\processed_data\MDLZ\8-K_2023-11-01.md'


2025-11-14 17:09:39,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:39,701 - INFO - Going to convert document batch...
2025-11-14 17:09:39,704 - INFO - Processing document 8-K_2024-02-02


Converted 'data\edgar_documents\MDLZ\8-K_2024-01-30' --> 'data\processed_data\MDLZ\8-K_2024-01-30.md'


2025-11-14 17:09:39,791 - INFO - Finished converting document 8-K_2024-02-02 in 0.19 sec.
2025-11-14 17:09:39,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:40,053 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDLZ\8-K_2024-02-02' --> 'data\processed_data\MDLZ\8-K_2024-02-02.md'


2025-11-14 17:09:40,056 - INFO - Processing document 8-K_2024-02-20
2025-11-14 17:09:40,226 - INFO - Finished converting document 8-K_2024-02-20 in 0.36 sec.
2025-11-14 17:09:40,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:40,383 - INFO - Going to convert document batch...
2025-11-14 17:09:40,385 - INFO - Processing document 8-K_2024-02-21
2025-11-14 17:09:40,449 - INFO - Finished converting document 8-K_2024-02-21 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2024-02-20' --> 'data\processed_data\MDLZ\8-K_2024-02-20.md'


2025-11-14 17:09:40,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:40,607 - INFO - Going to convert document batch...
2025-11-14 17:09:40,610 - INFO - Processing document 8-K_2024-04-30
2025-11-14 17:09:40,691 - INFO - Finished converting document 8-K_2024-04-30 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2024-02-21' --> 'data\processed_data\MDLZ\8-K_2024-02-21.md'


2025-11-14 17:09:40,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:41,011 - INFO - Going to convert document batch...
2025-11-14 17:09:41,012 - INFO - Processing document 8-K_2024-05-22


Converted 'data\edgar_documents\MDLZ\8-K_2024-04-30' --> 'data\processed_data\MDLZ\8-K_2024-04-30.md'


2025-11-14 17:09:41,203 - INFO - Finished converting document 8-K_2024-05-22 in 0.36 sec.
2025-11-14 17:09:41,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:41,478 - INFO - Going to convert document batch...
2025-11-14 17:09:41,479 - INFO - Processing document 8-K_2024-05-23


Converted 'data\edgar_documents\MDLZ\8-K_2024-05-22' --> 'data\processed_data\MDLZ\8-K_2024-05-22.md'


2025-11-14 17:09:41,629 - INFO - Finished converting document 8-K_2024-05-23 in 0.30 sec.
2025-11-14 17:09:41,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:41,887 - INFO - Going to convert document batch...
2025-11-14 17:09:41,889 - INFO - Processing document 8-K_2024-07-01


Converted 'data\edgar_documents\MDLZ\8-K_2024-05-23' --> 'data\processed_data\MDLZ\8-K_2024-05-23.md'


2025-11-14 17:09:42,126 - INFO - Finished converting document 8-K_2024-07-01 in 0.36 sec.
2025-11-14 17:09:42,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:42,294 - INFO - Going to convert document batch...
2025-11-14 17:09:42,296 - INFO - Processing document 8-K_2024-07-03


Converted 'data\edgar_documents\MDLZ\8-K_2024-07-01' --> 'data\processed_data\MDLZ\8-K_2024-07-01.md'


2025-11-14 17:09:42,404 - INFO - Finished converting document 8-K_2024-07-03 in 0.23 sec.
2025-11-14 17:09:42,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\8-K_2024-07-03' --> 'data\processed_data\MDLZ\8-K_2024-07-03.md'


2025-11-14 17:09:42,667 - INFO - Going to convert document batch...
2025-11-14 17:09:42,670 - INFO - Processing document 8-K_2024-07-30
2025-11-14 17:09:42,780 - INFO - Finished converting document 8-K_2024-07-30 in 0.31 sec.
2025-11-14 17:09:42,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:42,944 - INFO - Going to convert document batch...
2025-11-14 17:09:42,946 - INFO - Processing document 8-K_2024-08-23
2025-11-14 17:09:43,023 - INFO - Finished converting document 8-K_2024-08-23 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2024-07-30' --> 'data\processed_data\MDLZ\8-K_2024-07-30.md'


2025-11-14 17:09:43,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:43,204 - INFO - Going to convert document batch...
2025-11-14 17:09:43,208 - INFO - Processing document 8-K_2024-08-28


Converted 'data\edgar_documents\MDLZ\8-K_2024-08-23' --> 'data\processed_data\MDLZ\8-K_2024-08-23.md'


2025-11-14 17:09:43,352 - INFO - Finished converting document 8-K_2024-08-28 in 0.27 sec.
2025-11-14 17:09:43,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:43,550 - INFO - Going to convert document batch...
2025-11-14 17:09:43,553 - INFO - Processing document 8-K_2024-10-29
2025-11-14 17:09:43,628 - INFO - Finished converting document 8-K_2024-10-29 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2024-08-28' --> 'data\processed_data\MDLZ\8-K_2024-08-28.md'


2025-11-14 17:09:43,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:43,810 - INFO - Going to convert document batch...
2025-11-14 17:09:43,812 - INFO - Processing document 8-K_2024-12-03


Converted 'data\edgar_documents\MDLZ\8-K_2024-10-29' --> 'data\processed_data\MDLZ\8-K_2024-10-29.md'


2025-11-14 17:09:43,990 - INFO - Finished converting document 8-K_2024-12-03 in 0.30 sec.
2025-11-14 17:09:44,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:44,176 - INFO - Going to convert document batch...
2025-11-14 17:09:44,178 - INFO - Processing document 8-K_2025-01-15


Converted 'data\edgar_documents\MDLZ\8-K_2024-12-03' --> 'data\processed_data\MDLZ\8-K_2024-12-03.md'


2025-11-14 17:09:44,330 - INFO - Finished converting document 8-K_2025-01-15 in 0.28 sec.
2025-11-14 17:09:44,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:44,516 - INFO - Going to convert document batch...
2025-11-14 17:09:44,518 - INFO - Processing document 8-K_2025-01-27
2025-11-14 17:09:44,574 - INFO - Finished converting document 8-K_2025-01-27 in 0.16 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2025-01-15' --> 'data\processed_data\MDLZ\8-K_2025-01-15.md'


2025-11-14 17:09:44,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:44,757 - INFO - Going to convert document batch...
2025-11-14 17:09:44,761 - INFO - Processing document 8-K_2025-02-04


Converted 'data\edgar_documents\MDLZ\8-K_2025-01-27' --> 'data\processed_data\MDLZ\8-K_2025-01-27.md'


2025-11-14 17:09:44,880 - INFO - Finished converting document 8-K_2025-02-04 in 0.27 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2025-02-04' --> 'data\processed_data\MDLZ\8-K_2025-02-04.md'


2025-11-14 17:09:45,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:45,312 - INFO - Going to convert document batch...
2025-11-14 17:09:45,314 - INFO - Processing document 8-K_2025-02-18
2025-11-14 17:09:45,387 - INFO - Finished converting document 8-K_2025-02-18 in 0.45 sec.
2025-11-14 17:09:45,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:45,565 - INFO - Going to convert document batch...
2025-11-14 17:09:45,567 - INFO - Processing document 8-K_2025-02-20
2025-11-14 17:09:45,650 - INFO - Finished converting document 8-K_2025-02-20 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2025-02-18' --> 'data\processed_data\MDLZ\8-K_2025-02-18.md'


2025-11-14 17:09:45,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:45,806 - INFO - Going to convert document batch...
2025-11-14 17:09:45,807 - INFO - Processing document 8-K_2025-04-29


Converted 'data\edgar_documents\MDLZ\8-K_2025-02-20' --> 'data\processed_data\MDLZ\8-K_2025-02-20.md'


2025-11-14 17:09:46,008 - INFO - Finished converting document 8-K_2025-04-29 in 0.30 sec.
2025-11-14 17:09:46,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:46,179 - INFO - Going to convert document batch...
2025-11-14 17:09:46,180 - INFO - Processing document 8-K_2025-05-06


Converted 'data\edgar_documents\MDLZ\8-K_2025-04-29' --> 'data\processed_data\MDLZ\8-K_2025-04-29.md'


2025-11-14 17:09:46,289 - INFO - Finished converting document 8-K_2025-05-06 in 0.22 sec.
2025-11-14 17:09:46,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:46,485 - INFO - Going to convert document batch...
2025-11-14 17:09:46,488 - INFO - Processing document 8-K_2025-05-27


Converted 'data\edgar_documents\MDLZ\8-K_2025-05-06' --> 'data\processed_data\MDLZ\8-K_2025-05-06.md'


2025-11-14 17:09:46,771 - INFO - Finished converting document 8-K_2025-05-27 in 0.39 sec.
2025-11-14 17:09:46,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:09:46,996 - INFO - Going to convert document batch...
2025-11-14 17:09:46,999 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:09:47,087 - INFO - Finished converting document 8-K_2025-07-29 in 0.19 sec.


Converted 'data\edgar_documents\MDLZ\8-K_2025-05-27' --> 'data\processed_data\MDLZ\8-K_2025-05-27.md'


2025-11-14 17:09:47,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\8-K_2025-07-29' --> 'data\processed_data\MDLZ\8-K_2025-07-29.md'


2025-11-14 17:09:47,365 - INFO - Going to convert document batch...
2025-11-14 17:09:47,368 - INFO - Processing document 8-K_2025-10-28
2025-11-14 17:09:47,437 - INFO - Finished converting document 8-K_2025-10-28 in 0.30 sec.
2025-11-14 17:09:47,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\8-K_2025-10-28' --> 'data\processed_data\MDLZ\8-K_2025-10-28.md'


2025-11-14 17:09:50,291 - INFO - Going to convert document batch...
2025-11-14 17:09:50,293 - INFO - Processing document DEF-14A_2023-04-06
2025-11-14 17:09:58,034 - INFO - Finished converting document DEF-14A_2023-04-06 in 10.56 sec.
2025-11-14 17:10:02,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDLZ\DEF-14A_2023-04-06' --> 'data\processed_data\MDLZ\DEF-14A_2023-04-06.md'


2025-11-14 17:10:05,302 - INFO - Going to convert document batch...
2025-11-14 17:10:05,304 - INFO - Processing document DEF-14A_2024-04-05
2025-11-14 17:10:11,976 - INFO - Finished converting document DEF-14A_2024-04-05 in 9.50 sec.


Converted 'data\edgar_documents\MDLZ\DEF-14A_2024-04-05' --> 'data\processed_data\MDLZ\DEF-14A_2024-04-05.md'


2025-11-14 17:10:18,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:10:23,674 - INFO - Going to convert document batch...
2025-11-14 17:10:23,676 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 17:10:45,127 - INFO - Finished converting document DEF-14A_2025-04-04 in 26.97 sec.


Converted 'data\edgar_documents\MDLZ\DEF-14A_2025-04-04' --> 'data\processed_data\MDLZ\DEF-14A_2025-04-04.md'
Processed 75 new files. Errors: 8
Found 95 files to process in data\edgar_documents\MDT


2025-11-14 17:10:48,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:10:51,884 - INFO - Going to convert document batch...
2025-11-14 17:10:51,886 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:10:51,887 - INFO - Processing document 10-K_2023-06-22
2025-11-14 17:11:00,381 - INFO - Finished converting document 10-K_2023-06-22 in 11.88 sec.
2025-11-14 17:11:03,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-K_2023-06-22' --> 'data\processed_data\MDT\10-K_2023-06-22.md'


2025-11-14 17:11:07,534 - INFO - Going to convert document batch...
2025-11-14 17:11:07,540 - INFO - Processing document 10-K_2024-06-20
2025-11-14 17:11:15,259 - INFO - Finished converting document 10-K_2024-06-20 in 12.03 sec.


Converted 'data\edgar_documents\MDT\10-K_2024-06-20' --> 'data\processed_data\MDT\10-K_2024-06-20.md'


2025-11-14 17:11:18,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:11:22,556 - INFO - Going to convert document batch...
2025-11-14 17:11:22,559 - INFO - Processing document 10-K_2025-06-20
2025-11-14 17:11:30,477 - INFO - Finished converting document 10-K_2025-06-20 in 12.24 sec.
2025-11-14 17:11:33,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-K_2025-06-20' --> 'data\processed_data\MDT\10-K_2025-06-20.md'


2025-11-14 17:11:36,795 - INFO - Going to convert document batch...
2025-11-14 17:11:36,798 - INFO - Processing document 10-Q_2023-03-01
2025-11-14 17:11:41,207 - INFO - Finished converting document 10-Q_2023-03-01 in 7.66 sec.
2025-11-14 17:11:43,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-Q_2023-03-01' --> 'data\processed_data\MDT\10-Q_2023-03-01.md'


2025-11-14 17:11:46,131 - INFO - Going to convert document batch...
2025-11-14 17:11:46,133 - INFO - Processing document 10-Q_2023-08-31
2025-11-14 17:11:49,596 - INFO - Finished converting document 10-Q_2023-08-31 in 6.39 sec.


Converted 'data\edgar_documents\MDT\10-Q_2023-08-31' --> 'data\processed_data\MDT\10-Q_2023-08-31.md'


2025-11-14 17:11:51,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:11:53,988 - INFO - Going to convert document batch...
2025-11-14 17:11:53,990 - INFO - Processing document 10-Q_2023-11-30
2025-11-14 17:11:57,952 - INFO - Finished converting document 10-Q_2023-11-30 in 6.70 sec.
2025-11-14 17:12:00,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-Q_2023-11-30' --> 'data\processed_data\MDT\10-Q_2023-11-30.md'


2025-11-14 17:12:03,066 - INFO - Going to convert document batch...
2025-11-14 17:12:03,069 - INFO - Processing document 10-Q_2024-02-27
2025-11-14 17:12:06,845 - INFO - Finished converting document 10-Q_2024-02-27 in 6.33 sec.
2025-11-14 17:12:08,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-Q_2024-02-27' --> 'data\processed_data\MDT\10-Q_2024-02-27.md'


2025-11-14 17:12:11,563 - INFO - Going to convert document batch...
2025-11-14 17:12:11,565 - INFO - Processing document 10-Q_2024-08-27
2025-11-14 17:12:15,061 - INFO - Finished converting document 10-Q_2024-08-27 in 6.22 sec.


Converted 'data\edgar_documents\MDT\10-Q_2024-08-27' --> 'data\processed_data\MDT\10-Q_2024-08-27.md'


2025-11-14 17:12:16,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:19,994 - INFO - Going to convert document batch...
2025-11-14 17:12:19,998 - INFO - Processing document 10-Q_2024-11-26
2025-11-14 17:12:23,811 - INFO - Finished converting document 10-Q_2024-11-26 in 7.11 sec.
2025-11-14 17:12:25,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-Q_2024-11-26' --> 'data\processed_data\MDT\10-Q_2024-11-26.md'


2025-11-14 17:12:27,923 - INFO - Going to convert document batch...
2025-11-14 17:12:27,926 - INFO - Processing document 10-Q_2025-02-25
2025-11-14 17:12:32,881 - INFO - Finished converting document 10-Q_2025-02-25 in 7.27 sec.
2025-11-14 17:12:35,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\10-Q_2025-02-25' --> 'data\processed_data\MDT\10-Q_2025-02-25.md'


2025-11-14 17:12:36,910 - INFO - Going to convert document batch...
2025-11-14 17:12:36,913 - INFO - Processing document 10-Q_2025-08-26
2025-11-14 17:12:40,471 - INFO - Finished converting document 10-Q_2025-08-26 in 5.59 sec.
2025-11-14 17:12:42,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:42,981 - INFO - Going to convert document batch...
2025-11-14 17:12:42,983 - INFO - Processing document 4_2023-02-01
2025-11-14 17:12:43,051 - INFO - Finished converting document 4_2023-02-01 in 0.16 sec.


Converted 'data\edgar_documents\MDT\10-Q_2025-08-26' --> 'data\processed_data\MDT\10-Q_2025-08-26.md'


2025-11-14 17:12:43,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:43,196 - INFO - Going to convert document batch...
2025-11-14 17:12:43,199 - INFO - Processing document 4_2023-02-02
2025-11-14 17:12:43,277 - INFO - Finished converting document 4_2023-02-02 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2023-02-01' --> 'data\processed_data\MDT\4_2023-02-01.md'


2025-11-14 17:12:43,424 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:12:43,427 - ERROR - Input document 4_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:12:43,432 - INFO - Going to convert document batch...
2025-11-14 17:12:43,495 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:12:43,497 - ERROR - Input document 4_2023-03-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MDT\4_2023-02-02' --> 'data\processed_data\MDT\4_2023-02-02.md'
Error processing data\edgar_documents\MDT\4_2023-03-23: File format not allowed: data\edgar_documents\MDT\4_2023-03-23
Error processing data\edgar_documents\MDT\4_2023-03-24: File format not allowed: data\edgar_documents\MDT\4_2023-03-24


2025-11-14 17:12:43,609 - INFO - Going to convert document batch...
2025-11-14 17:12:43,612 - INFO - Processing document 4_2023-04-07
2025-11-14 17:12:43,746 - INFO - Finished converting document 4_2023-04-07 in 0.25 sec.
2025-11-14 17:12:43,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:43,935 - INFO - Going to convert document batch...
2025-11-14 17:12:43,937 - INFO - Processing document 4_2023-04-20
2025-11-14 17:12:44,016 - INFO - Finished converting document 4_2023-04-20 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2023-04-07' --> 'data\processed_data\MDT\4_2023-04-07.md'


2025-11-14 17:12:44,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:44,219 - INFO - Going to convert document batch...
2025-11-14 17:12:44,222 - INFO - Processing document 4_2023-05-03


Converted 'data\edgar_documents\MDT\4_2023-04-20' --> 'data\processed_data\MDT\4_2023-04-20.md'


2025-11-14 17:12:44,325 - INFO - Finished converting document 4_2023-05-03 in 0.22 sec.
2025-11-14 17:12:44,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\4_2023-05-03' --> 'data\processed_data\MDT\4_2023-05-03.md'


2025-11-14 17:12:44,635 - INFO - Going to convert document batch...
2025-11-14 17:12:44,640 - INFO - Processing document 4_2023-07-12
2025-11-14 17:12:44,747 - INFO - Finished converting document 4_2023-07-12 in 0.33 sec.
2025-11-14 17:12:44,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:44,934 - INFO - Going to convert document batch...
2025-11-14 17:12:44,937 - INFO - Processing document 4_2023-07-18
2025-11-14 17:12:45,010 - INFO - Finished converting document 4_2023-07-18 in 0.12 sec.


Converted 'data\edgar_documents\MDT\4_2023-07-12' --> 'data\processed_data\MDT\4_2023-07-12.md'


2025-11-14 17:12:45,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:45,185 - INFO - Going to convert document batch...
2025-11-14 17:12:45,188 - INFO - Processing document 4_2023-08-02


Converted 'data\edgar_documents\MDT\4_2023-07-18' --> 'data\processed_data\MDT\4_2023-07-18.md'


2025-11-14 17:12:45,282 - INFO - Finished converting document 4_2023-08-02 in 0.20 sec.
2025-11-14 17:12:45,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:45,569 - INFO - Going to convert document batch...
2025-11-14 17:12:45,571 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\MDT\4_2023-08-02' --> 'data\processed_data\MDT\4_2023-08-02.md'


2025-11-14 17:12:45,661 - INFO - Finished converting document 4_2023-08-07 in 0.20 sec.
2025-11-14 17:12:45,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:45,825 - INFO - Going to convert document batch...
2025-11-14 17:12:45,827 - INFO - Processing document 4_2023-08-16
2025-11-14 17:12:45,921 - INFO - Finished converting document 4_2023-08-16 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2023-08-07' --> 'data\processed_data\MDT\4_2023-08-07.md'


2025-11-14 17:12:46,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:46,143 - INFO - Going to convert document batch...
2025-11-14 17:12:46,145 - INFO - Processing document 4_2023-08-25


Converted 'data\edgar_documents\MDT\4_2023-08-16' --> 'data\processed_data\MDT\4_2023-08-16.md'


2025-11-14 17:12:46,253 - INFO - Finished converting document 4_2023-08-25 in 0.22 sec.
2025-11-14 17:12:46,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:46,409 - INFO - Going to convert document batch...
2025-11-14 17:12:46,412 - INFO - Processing document 4_2023-11-01


Converted 'data\edgar_documents\MDT\4_2023-08-25' --> 'data\processed_data\MDT\4_2023-08-25.md'


2025-11-14 17:12:46,584 - INFO - Finished converting document 4_2023-11-01 in 0.23 sec.
2025-11-14 17:12:46,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:46,768 - INFO - Going to convert document batch...
2025-11-14 17:12:46,770 - INFO - Processing document 4_2023-12-12
2025-11-14 17:12:46,851 - INFO - Finished converting document 4_2023-12-12 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2023-11-01' --> 'data\processed_data\MDT\4_2023-11-01.md'


2025-11-14 17:12:47,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:47,034 - INFO - Going to convert document batch...
2025-11-14 17:12:47,037 - INFO - Processing document 4_2023-12-20
2025-11-14 17:12:47,125 - INFO - Finished converting document 4_2023-12-20 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2023-12-12' --> 'data\processed_data\MDT\4_2023-12-12.md'


2025-11-14 17:12:47,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\4_2023-12-20' --> 'data\processed_data\MDT\4_2023-12-20.md'


2025-11-14 17:12:48,312 - INFO - Going to convert document batch...
2025-11-14 17:12:48,317 - INFO - Processing document 4_2024-02-02
2025-11-14 17:12:48,411 - INFO - Finished converting document 4_2024-02-02 in 1.14 sec.
2025-11-14 17:12:48,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:48,648 - INFO - Going to convert document batch...
2025-11-14 17:12:48,651 - INFO - Processing document 4_2024-02-23


Converted 'data\edgar_documents\MDT\4_2024-02-02' --> 'data\processed_data\MDT\4_2024-02-02.md'


2025-11-14 17:12:48,829 - INFO - Finished converting document 4_2024-02-23 in 0.31 sec.
2025-11-14 17:12:49,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:49,156 - INFO - Going to convert document batch...
2025-11-14 17:12:49,159 - INFO - Processing document 4_2024-03-07
2025-11-14 17:12:49,234 - INFO - Finished converting document 4_2024-03-07 in 0.20 sec.


Converted 'data\edgar_documents\MDT\4_2024-02-23' --> 'data\processed_data\MDT\4_2024-02-23.md'


2025-11-14 17:12:49,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:49,393 - INFO - Going to convert document batch...
2025-11-14 17:12:49,395 - INFO - Processing document 4_2024-04-09
2025-11-14 17:12:49,476 - INFO - Finished converting document 4_2024-04-09 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2024-03-07' --> 'data\processed_data\MDT\4_2024-03-07.md'


2025-11-14 17:12:49,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:49,669 - INFO - Going to convert document batch...
2025-11-14 17:12:49,672 - INFO - Processing document 4_2024-05-01


Converted 'data\edgar_documents\MDT\4_2024-04-09' --> 'data\processed_data\MDT\4_2024-04-09.md'


2025-11-14 17:12:49,785 - INFO - Finished converting document 4_2024-05-01 in 0.23 sec.
2025-11-14 17:12:49,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:49,937 - INFO - Going to convert document batch...
2025-11-14 17:12:49,940 - INFO - Processing document 4_2024-05-03
2025-11-14 17:12:50,015 - INFO - Finished converting document 4_2024-05-03 in 0.14 sec.


Converted 'data\edgar_documents\MDT\4_2024-05-01' --> 'data\processed_data\MDT\4_2024-05-01.md'


2025-11-14 17:12:50,259 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:12:50,260 - ERROR - Input document 4_2024-05-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:12:50,266 - INFO - Going to convert document batch...
2025-11-14 17:12:50,347 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:12:50,349 - ERROR - Input document 4_2024-05-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MDT\4_2024-05-03' --> 'data\processed_data\MDT\4_2024-05-03.md'
Error processing data\edgar_documents\MDT\4_2024-05-29: File format not allowed: data\edgar_documents\MDT\4_2024-05-29
Error processing data\edgar_documents\MDT\4_2024-05-30: File format not allowed: data\edgar_documents\MDT\4_2024-05-30


2025-11-14 17:12:50,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:50,439 - INFO - Going to convert document batch...
2025-11-14 17:12:50,442 - INFO - Processing document 4_2024-06-11
2025-11-14 17:12:50,542 - INFO - Finished converting document 4_2024-06-11 in 0.19 sec.
2025-11-14 17:12:50,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:50,749 - INFO - Going to convert document batch...
2025-11-14 17:12:50,751 - INFO - Processing document 4_2024-07-19
2025-11-14 17:12:50,836 - INFO - Finished converting document 4_2024-07-19 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2024-06-11' --> 'data\processed_data\MDT\4_2024-06-11.md'


2025-11-14 17:12:50,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:50,982 - INFO - Going to convert document batch...
2025-11-14 17:12:50,984 - INFO - Processing document 4_2024-07-31
2025-11-14 17:12:51,078 - INFO - Finished converting document 4_2024-07-31 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2024-07-19' --> 'data\processed_data\MDT\4_2024-07-19.md'


2025-11-14 17:12:51,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:51,275 - INFO - Going to convert document batch...
2025-11-14 17:12:51,277 - INFO - Processing document 4_2024-08-02
2025-11-14 17:12:51,344 - INFO - Finished converting document 4_2024-08-02 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2024-07-31' --> 'data\processed_data\MDT\4_2024-07-31.md'


2025-11-14 17:12:51,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:51,532 - INFO - Going to convert document batch...
2025-11-14 17:12:51,534 - INFO - Processing document 4_2024-08-06


Converted 'data\edgar_documents\MDT\4_2024-08-02' --> 'data\processed_data\MDT\4_2024-08-02.md'


2025-11-14 17:12:51,635 - INFO - Finished converting document 4_2024-08-06 in 0.20 sec.
2025-11-14 17:12:51,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:51,818 - INFO - Going to convert document batch...
2025-11-14 17:12:51,822 - INFO - Processing document 4_2024-08-19
2025-11-14 17:12:51,909 - INFO - Finished converting document 4_2024-08-19 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2024-08-06' --> 'data\processed_data\MDT\4_2024-08-06.md'


2025-11-14 17:12:52,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:52,089 - INFO - Going to convert document batch...
2025-11-14 17:12:52,090 - INFO - Processing document 4_2024-08-21
2025-11-14 17:12:52,164 - INFO - Finished converting document 4_2024-08-21 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2024-08-19' --> 'data\processed_data\MDT\4_2024-08-19.md'


2025-11-14 17:12:52,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:52,356 - INFO - Going to convert document batch...
2025-11-14 17:12:52,358 - INFO - Processing document 4_2024-12-09
2025-11-14 17:12:52,443 - INFO - Finished converting document 4_2024-12-09 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2024-08-21' --> 'data\processed_data\MDT\4_2024-08-21.md'


2025-11-14 17:12:52,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:52,600 - INFO - Going to convert document batch...
2025-11-14 17:12:52,604 - INFO - Processing document 4_2024-12-10
2025-11-14 17:12:52,714 - INFO - Finished converting document 4_2024-12-10 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2024-12-09' --> 'data\processed_data\MDT\4_2024-12-09.md'


2025-11-14 17:12:52,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:52,941 - INFO - Going to convert document batch...
2025-11-14 17:12:52,943 - INFO - Processing document 4_2024-12-11
2025-11-14 17:12:53,013 - INFO - Finished converting document 4_2024-12-11 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2024-12-10' --> 'data\processed_data\MDT\4_2024-12-10.md'


2025-11-14 17:12:53,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:53,176 - INFO - Going to convert document batch...
2025-11-14 17:12:53,178 - INFO - Processing document 4_2024-12-17
2025-11-14 17:12:53,266 - INFO - Finished converting document 4_2024-12-17 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2024-12-11' --> 'data\processed_data\MDT\4_2024-12-11.md'


2025-11-14 17:12:53,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:53,448 - INFO - Going to convert document batch...
2025-11-14 17:12:53,452 - INFO - Processing document 4_2025-01-10


Converted 'data\edgar_documents\MDT\4_2024-12-17' --> 'data\processed_data\MDT\4_2024-12-17.md'


2025-11-14 17:12:53,632 - INFO - Finished converting document 4_2025-01-10 in 0.28 sec.
2025-11-14 17:12:53,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:53,839 - INFO - Going to convert document batch...
2025-11-14 17:12:53,841 - INFO - Processing document 4_2025-01-23
2025-11-14 17:12:53,920 - INFO - Finished converting document 4_2025-01-23 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2025-01-10' --> 'data\processed_data\MDT\4_2025-01-10.md'


2025-11-14 17:12:54,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:54,105 - INFO - Going to convert document batch...
2025-11-14 17:12:54,108 - INFO - Processing document 4_2025-01-27
2025-11-14 17:12:54,193 - INFO - Finished converting document 4_2025-01-27 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2025-01-23' --> 'data\processed_data\MDT\4_2025-01-23.md'


2025-11-14 17:12:54,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:54,338 - INFO - Going to convert document batch...
2025-11-14 17:12:54,341 - INFO - Processing document 4_2025-01-28
2025-11-14 17:12:54,436 - INFO - Finished converting document 4_2025-01-28 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2025-01-27' --> 'data\processed_data\MDT\4_2025-01-27.md'


2025-11-14 17:12:54,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:54,619 - INFO - Going to convert document batch...
2025-11-14 17:12:54,620 - INFO - Processing document 4_2025-03-05
2025-11-14 17:12:54,713 - INFO - Finished converting document 4_2025-03-05 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2025-01-28' --> 'data\processed_data\MDT\4_2025-01-28.md'


2025-11-14 17:12:54,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:54,898 - INFO - Going to convert document batch...
2025-11-14 17:12:54,900 - INFO - Processing document 4_2025-03-10


Converted 'data\edgar_documents\MDT\4_2025-03-05' --> 'data\processed_data\MDT\4_2025-03-05.md'


2025-11-14 17:12:55,002 - INFO - Finished converting document 4_2025-03-10 in 0.20 sec.
2025-11-14 17:12:55,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:55,198 - INFO - Going to convert document batch...
2025-11-14 17:12:55,200 - INFO - Processing document 4_2025-04-30
2025-11-14 17:12:55,275 - INFO - Finished converting document 4_2025-04-30 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2025-03-10' --> 'data\processed_data\MDT\4_2025-03-10.md'


2025-11-14 17:12:55,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:55,454 - INFO - Going to convert document batch...
2025-11-14 17:12:55,456 - INFO - Processing document 4_2025-05-05
2025-11-14 17:12:55,522 - INFO - Finished converting document 4_2025-05-05 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2025-04-30' --> 'data\processed_data\MDT\4_2025-04-30.md'


2025-11-14 17:12:55,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:55,704 - INFO - Going to convert document batch...
2025-11-14 17:12:55,706 - INFO - Processing document 4_2025-06-04
2025-11-14 17:12:55,780 - INFO - Finished converting document 4_2025-06-04 in 0.17 sec.


Converted 'data\edgar_documents\MDT\4_2025-05-05' --> 'data\processed_data\MDT\4_2025-05-05.md'


2025-11-14 17:12:55,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:55,990 - INFO - Going to convert document batch...
2025-11-14 17:12:55,992 - INFO - Processing document 4_2025-07-30


Converted 'data\edgar_documents\MDT\4_2025-06-04' --> 'data\processed_data\MDT\4_2025-06-04.md'


2025-11-14 17:12:56,110 - INFO - Finished converting document 4_2025-07-30 in 0.23 sec.
2025-11-14 17:12:56,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:56,302 - INFO - Going to convert document batch...
2025-11-14 17:12:56,304 - INFO - Processing document 4_2025-08-01
2025-11-14 17:12:56,391 - INFO - Finished converting document 4_2025-08-01 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2025-07-30' --> 'data\processed_data\MDT\4_2025-07-30.md'


2025-11-14 17:12:56,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:56,595 - INFO - Going to convert document batch...
2025-11-14 17:12:56,598 - INFO - Processing document 4_2025-08-04


Converted 'data\edgar_documents\MDT\4_2025-08-01' --> 'data\processed_data\MDT\4_2025-08-01.md'


2025-11-14 17:12:56,748 - INFO - Finished converting document 4_2025-08-04 in 0.27 sec.
2025-11-14 17:12:56,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:56,942 - INFO - Going to convert document batch...
2025-11-14 17:12:56,944 - INFO - Processing document 4_2025-08-21
2025-11-14 17:12:57,041 - INFO - Finished converting document 4_2025-08-21 in 0.16 sec.


Converted 'data\edgar_documents\MDT\4_2025-08-04' --> 'data\processed_data\MDT\4_2025-08-04.md'


2025-11-14 17:12:57,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:57,154 - INFO - Going to convert document batch...
2025-11-14 17:12:57,155 - INFO - Processing document 4_2025-08-25
2025-11-14 17:12:57,297 - INFO - Finished converting document 4_2025-08-25 in 0.19 sec.


Converted 'data\edgar_documents\MDT\4_2025-08-21' --> 'data\processed_data\MDT\4_2025-08-21.md'


2025-11-14 17:12:57,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:57,385 - INFO - Going to convert document batch...
2025-11-14 17:12:57,386 - INFO - Processing document 4_2025-09-05
2025-11-14 17:12:57,425 - INFO - Finished converting document 4_2025-09-05 in 0.08 sec.
2025-11-14 17:12:57,541 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\MDT\4_2025-08-25' --> 'data\processed_data\MDT\4_2025-08-25.md'
Converted 'data\edgar_documents\MDT\4_2025-09-05' --> 'data\processed_data\MDT\4_2025-09-05.md'


2025-11-14 17:12:57,544 - ERROR - Input document 4_2025-09-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:12:57,549 - INFO - Going to convert document batch...
2025-11-14 17:12:57,598 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:12:57,600 - ERROR - Input document 4_2025-09-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\MDT\4_2025-09-15: File format not allowed: data\edgar_documents\MDT\4_2025-09-15
Error processing data\edgar_documents\MDT\4_2025-09-16: File format not allowed: data\edgar_documents\MDT\4_2025-09-16


2025-11-14 17:12:57,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:57,805 - INFO - Going to convert document batch...
2025-11-14 17:12:57,807 - INFO - Processing document 8-K_2023-03-07
2025-11-14 17:12:57,855 - INFO - Finished converting document 8-K_2023-03-07 in 0.11 sec.
2025-11-14 17:12:57,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:57,923 - INFO - Going to convert document batch...
2025-11-14 17:12:57,924 - INFO - Processing document 8-K_2023-03-09
2025-11-14 17:12:57,951 - INFO - Finished converting document 8-K_2023-03-09 in 0.08 sec.


Converted 'data\edgar_documents\MDT\8-K_2023-02-21' --> 'data\processed_data\MDT\8-K_2023-02-21.md'
Converted 'data\edgar_documents\MDT\8-K_2023-03-07' --> 'data\processed_data\MDT\8-K_2023-03-07.md'


2025-11-14 17:12:57,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,007 - INFO - Going to convert document batch...
2025-11-14 17:12:58,008 - INFO - Processing document 8-K_2023-03-30
2025-11-14 17:12:58,041 - INFO - Finished converting document 8-K_2023-03-30 in 0.08 sec.
2025-11-14 17:12:58,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,142 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDT\8-K_2023-03-09' --> 'data\processed_data\MDT\8-K_2023-03-09.md'
Converted 'data\edgar_documents\MDT\8-K_2023-03-30' --> 'data\processed_data\MDT\8-K_2023-03-30.md'


2025-11-14 17:12:58,143 - INFO - Processing document 8-K_2023-05-25
2025-11-14 17:12:58,175 - INFO - Finished converting document 8-K_2023-05-25 in 0.09 sec.
2025-11-14 17:12:58,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,232 - INFO - Going to convert document batch...
2025-11-14 17:12:58,233 - INFO - Processing document 8-K_2023-06-26
2025-11-14 17:12:58,264 - INFO - Finished converting document 8-K_2023-06-26 in 0.08 sec.
2025-11-14 17:12:58,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,314 - INFO - Going to convert document batch...
2025-11-14 17:12:58,315 - INFO - Processing document 8-K_2023-08-22
2025-11-14 17:12:58,347 - INFO - Finished converting document 8-K_2023-08-22 in 0.06 sec.
2025-11-14 17:12:58,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\8-K_2023-05-25' --> 'data\processed_data\MDT\8-K_2023-05-25.md'
Converted 'data\edgar_documents\MDT\8-K_2023-06-26' --> 'data\processed_data\MDT\8-K_2023-06-26.md'
Converted 'data\edgar_documents\MDT\8-K_2023-08-22' --> 'data\processed_data\MDT\8-K_2023-08-22.md'


2025-11-14 17:12:58,407 - INFO - Going to convert document batch...
2025-11-14 17:12:58,408 - INFO - Processing document 8-K_2023-10-23
2025-11-14 17:12:58,478 - INFO - Finished converting document 8-K_2023-10-23 in 0.11 sec.
2025-11-14 17:12:58,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,545 - INFO - Going to convert document batch...
2025-11-14 17:12:58,546 - INFO - Processing document 8-K_2023-11-21
2025-11-14 17:12:58,574 - INFO - Finished converting document 8-K_2023-11-21 in 0.08 sec.
2025-11-14 17:12:58,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,619 - INFO - Going to convert document batch...
2025-11-14 17:12:58,620 - INFO - Processing document 8-K_2023-12-06
2025-11-14 17:12:58,644 - INFO - Finished converting document 8-K_2023-12-06 in 0.05 sec.
2025-11-14 17:12:58,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\8-K_2023-10-23' --> 'data\processed_data\MDT\8-K_2023-10-23.md'
Converted 'data\edgar_documents\MDT\8-K_2023-11-21' --> 'data\processed_data\MDT\8-K_2023-11-21.md'
Converted 'data\edgar_documents\MDT\8-K_2023-12-06' --> 'data\processed_data\MDT\8-K_2023-12-06.md'


2025-11-14 17:12:58,711 - INFO - Going to convert document batch...
2025-11-14 17:12:58,712 - INFO - Processing document 8-K_2024-02-20
2025-11-14 17:12:58,746 - INFO - Finished converting document 8-K_2024-02-20 in 0.09 sec.
2025-11-14 17:12:58,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,794 - INFO - Going to convert document batch...
2025-11-14 17:12:58,795 - INFO - Processing document 8-K_2024-05-23
2025-11-14 17:12:58,825 - INFO - Finished converting document 8-K_2024-05-23 in 0.06 sec.
2025-11-14 17:12:58,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,868 - INFO - Going to convert document batch...
2025-11-14 17:12:58,869 - INFO - Processing document 8-K_2024-06-03
2025-11-14 17:12:58,898 - INFO - Finished converting document 8-K_2024-06-03 in 0.06 sec.
2025-11-14 17:12:58,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:58,942 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MDT\8-K_2024-02-20' --> 'data\processed_data\MDT\8-K_2024-02-20.md'
Converted 'data\edgar_documents\MDT\8-K_2024-05-23' --> 'data\processed_data\MDT\8-K_2024-05-23.md'
Converted 'data\edgar_documents\MDT\8-K_2024-06-03' --> 'data\processed_data\MDT\8-K_2024-06-03.md'


2025-11-14 17:12:59,181 - INFO - Finished converting document 8-K_2024-06-04 in 0.27 sec.
2025-11-14 17:12:59,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,245 - INFO - Going to convert document batch...
2025-11-14 17:12:59,246 - INFO - Processing document 8-K_2024-06-26
2025-11-14 17:12:59,290 - INFO - Finished converting document 8-K_2024-06-26 in 0.09 sec.
2025-11-14 17:12:59,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,334 - INFO - Going to convert document batch...
2025-11-14 17:12:59,335 - INFO - Processing document 8-K_2024-08-16
2025-11-14 17:12:59,360 - INFO - Finished converting document 8-K_2024-08-16 in 0.06 sec.


Converted 'data\edgar_documents\MDT\8-K_2024-06-04' --> 'data\processed_data\MDT\8-K_2024-06-04.md'
Converted 'data\edgar_documents\MDT\8-K_2024-06-26' --> 'data\processed_data\MDT\8-K_2024-06-26.md'


2025-11-14 17:12:59,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,407 - INFO - Going to convert document batch...
2025-11-14 17:12:59,408 - INFO - Processing document 8-K_2024-08-20
2025-11-14 17:12:59,442 - INFO - Finished converting document 8-K_2024-08-20 in 0.06 sec.
2025-11-14 17:12:59,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,501 - INFO - Going to convert document batch...
2025-11-14 17:12:59,502 - INFO - Processing document 8-K_2024-10-21
2025-11-14 17:12:59,548 - INFO - Finished converting document 8-K_2024-10-21 in 0.09 sec.


Converted 'data\edgar_documents\MDT\8-K_2024-08-16' --> 'data\processed_data\MDT\8-K_2024-08-16.md'
Converted 'data\edgar_documents\MDT\8-K_2024-08-20' --> 'data\processed_data\MDT\8-K_2024-08-20.md'


2025-11-14 17:12:59,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,600 - INFO - Going to convert document batch...
2025-11-14 17:12:59,601 - INFO - Processing document 8-K_2024-11-19
2025-11-14 17:12:59,646 - INFO - Finished converting document 8-K_2024-11-19 in 0.08 sec.
2025-11-14 17:12:59,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,729 - INFO - Going to convert document batch...
2025-11-14 17:12:59,730 - INFO - Processing document 8-K_2025-01-21


Converted 'data\edgar_documents\MDT\8-K_2024-10-21' --> 'data\processed_data\MDT\8-K_2024-10-21.md'
Converted 'data\edgar_documents\MDT\8-K_2024-11-19' --> 'data\processed_data\MDT\8-K_2024-11-19.md'


2025-11-14 17:12:59,769 - INFO - Finished converting document 8-K_2025-01-21 in 0.09 sec.
2025-11-14 17:12:59,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,850 - INFO - Going to convert document batch...
2025-11-14 17:12:59,851 - INFO - Processing document 8-K_2025-02-18
2025-11-14 17:12:59,898 - INFO - Finished converting document 8-K_2025-02-18 in 0.09 sec.
2025-11-14 17:12:59,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:12:59,978 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MDT\8-K_2025-01-21' --> 'data\processed_data\MDT\8-K_2025-01-21.md'
Converted 'data\edgar_documents\MDT\8-K_2025-02-18' --> 'data\processed_data\MDT\8-K_2025-02-18.md'


2025-11-14 17:12:59,980 - INFO - Processing document 8-K_2025-03-17
2025-11-14 17:13:00,037 - INFO - Finished converting document 8-K_2025-03-17 in 0.11 sec.
2025-11-14 17:13:00,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,086 - INFO - Going to convert document batch...
2025-11-14 17:13:00,087 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:13:00,120 - INFO - Finished converting document 8-K_2025-05-21 in 0.08 sec.
2025-11-14 17:13:00,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,171 - INFO - Going to convert document batch...
2025-11-14 17:13:00,171 - INFO - Processing document 8-K_2025-06-23
2025-11-14 17:13:00,203 - INFO - Finished converting document 8-K_2025-06-23 in 0.06 sec.


Converted 'data\edgar_documents\MDT\8-K_2025-03-17' --> 'data\processed_data\MDT\8-K_2025-03-17.md'
Converted 'data\edgar_documents\MDT\8-K_2025-05-21' --> 'data\processed_data\MDT\8-K_2025-05-21.md'
Converted 'data\edgar_documents\MDT\8-K_2025-06-23' --> 'data\processed_data\MDT\8-K_2025-06-23.md'


2025-11-14 17:13:00,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,255 - INFO - Going to convert document batch...
2025-11-14 17:13:00,256 - INFO - Processing document 8-K_2025-08-19
2025-11-14 17:13:00,291 - INFO - Finished converting document 8-K_2025-08-19 in 0.06 sec.
2025-11-14 17:13:00,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,338 - INFO - Going to convert document batch...
2025-11-14 17:13:00,339 - INFO - Processing document 8-K_2025-09-16
2025-11-14 17:13:00,363 - INFO - Finished converting document 8-K_2025-09-16 in 0.05 sec.
2025-11-14 17:13:00,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,431 - INFO - Going to convert document batch...
2025-11-14 17:13:00,431 - INFO - Processing document 8-K_2025-09-29
2025-11-14 17:13:00,463 - INFO - Finished converting document 8-K_2025-09-29 in 0.08 sec.
2025-11-14 17:13:00,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\8-K_2025-08-19' --> 'data\processed_data\MDT\8-K_2025-08-19.md'
Converted 'data\edgar_documents\MDT\8-K_2025-09-16' --> 'data\processed_data\MDT\8-K_2025-09-16.md'
Converted 'data\edgar_documents\MDT\8-K_2025-09-29' --> 'data\processed_data\MDT\8-K_2025-09-29.md'


2025-11-14 17:13:00,534 - INFO - Going to convert document batch...
2025-11-14 17:13:00,536 - INFO - Processing document 8-K_2025-10-21
2025-11-14 17:13:00,624 - INFO - Finished converting document 8-K_2025-10-21 in 0.14 sec.
2025-11-14 17:13:00,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:00,688 - INFO - Going to convert document batch...
2025-11-14 17:13:00,689 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:13:00,712 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 17:13:00,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\8-K_2025-10-21' --> 'data\processed_data\MDT\8-K_2025-10-21.md'
Converted 'data\edgar_documents\MDT\8-K_2025-11-03' --> 'data\processed_data\MDT\8-K_2025-11-03.md'


2025-11-14 17:13:01,422 - INFO - Going to convert document batch...
2025-11-14 17:13:01,422 - INFO - Processing document DEF-14A_2023-08-11
2025-11-14 17:13:02,636 - INFO - Finished converting document DEF-14A_2023-08-11 in 1.92 sec.
2025-11-14 17:13:03,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\DEF-14A_2023-08-11' --> 'data\processed_data\MDT\DEF-14A_2023-08-11.md'


2025-11-14 17:13:03,632 - INFO - Going to convert document batch...
2025-11-14 17:13:03,633 - INFO - Processing document DEF-14A_2024-08-09
2025-11-14 17:13:04,962 - INFO - Finished converting document DEF-14A_2024-08-09 in 1.80 sec.
2025-11-14 17:13:05,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MDT\DEF-14A_2024-08-09' --> 'data\processed_data\MDT\DEF-14A_2024-08-09.md'


2025-11-14 17:13:05,888 - INFO - Going to convert document batch...
2025-11-14 17:13:05,889 - INFO - Processing document DEF-14A_2025-08-25
2025-11-14 17:13:07,103 - INFO - Finished converting document DEF-14A_2025-08-25 in 1.64 sec.


Converted 'data\edgar_documents\MDT\DEF-14A_2025-08-25' --> 'data\processed_data\MDT\DEF-14A_2025-08-25.md'
Processed 89 new files. Errors: 6
Found 128 files to process in data\edgar_documents\MET


2025-11-14 17:13:07,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:11,292 - INFO - Going to convert document batch...
2025-11-14 17:13:11,293 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:13:11,294 - INFO - Processing document 10-K_2023-02-23
2025-11-14 17:13:19,141 - INFO - Finished converting document 10-K_2023-02-23 in 11.44 sec.


Converted 'data\edgar_documents\MET\10-K_2023-02-23' --> 'data\processed_data\MET\10-K_2023-02-23.md'


2025-11-14 17:13:22,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:26,410 - INFO - Going to convert document batch...
2025-11-14 17:13:26,411 - INFO - Processing document 10-K_2024-02-16
2025-11-14 17:13:37,099 - INFO - Finished converting document 10-K_2024-02-16 in 15.28 sec.


Converted 'data\edgar_documents\MET\10-K_2024-02-16' --> 'data\processed_data\MET\10-K_2024-02-16.md'


2025-11-14 17:13:40,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:13:45,108 - INFO - Going to convert document batch...
2025-11-14 17:13:45,109 - INFO - Processing document 10-K_2025-02-21
2025-11-14 17:14:01,618 - INFO - Finished converting document 10-K_2025-02-21 in 20.98 sec.


Converted 'data\edgar_documents\MET\10-K_2025-02-21' --> 'data\processed_data\MET\10-K_2025-02-21.md'


2025-11-14 17:14:05,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:14:08,308 - INFO - Going to convert document batch...
2025-11-14 17:14:08,309 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 17:14:15,197 - INFO - Finished converting document 10-Q_2023-05-04 in 10.30 sec.
2025-11-14 17:14:17,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2023-05-04' --> 'data\processed_data\MET\10-Q_2023-05-04.md'


2025-11-14 17:14:21,244 - INFO - Going to convert document batch...
2025-11-14 17:14:21,245 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 17:14:27,259 - INFO - Finished converting document 10-Q_2023-08-04 in 9.83 sec.
2025-11-14 17:14:30,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2023-08-04' --> 'data\processed_data\MET\10-Q_2023-08-04.md'


2025-11-14 17:14:34,137 - INFO - Going to convert document batch...
2025-11-14 17:14:34,138 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 17:14:41,276 - INFO - Finished converting document 10-Q_2023-11-02 in 10.47 sec.
2025-11-14 17:14:43,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2023-11-02' --> 'data\processed_data\MET\10-Q_2023-11-02.md'


2025-11-14 17:14:45,557 - INFO - Going to convert document batch...
2025-11-14 17:14:45,557 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 17:14:50,419 - INFO - Finished converting document 10-Q_2024-05-02 in 6.69 sec.
2025-11-14 17:14:52,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2024-05-02' --> 'data\processed_data\MET\10-Q_2024-05-02.md'


2025-11-14 17:14:55,450 - INFO - Going to convert document batch...
2025-11-14 17:14:55,450 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 17:15:00,277 - INFO - Finished converting document 10-Q_2024-08-01 in 8.14 sec.
2025-11-14 17:15:03,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2024-08-01' --> 'data\processed_data\MET\10-Q_2024-08-01.md'


2025-11-14 17:15:06,043 - INFO - Going to convert document batch...
2025-11-14 17:15:06,044 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 17:15:10,867 - INFO - Finished converting document 10-Q_2024-11-01 in 7.53 sec.
2025-11-14 17:15:13,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2024-11-01' --> 'data\processed_data\MET\10-Q_2024-11-01.md'


2025-11-14 17:15:16,442 - INFO - Going to convert document batch...
2025-11-14 17:15:16,442 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 17:15:20,097 - INFO - Finished converting document 10-Q_2025-05-01 in 7.08 sec.
2025-11-14 17:15:21,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2025-05-01' --> 'data\processed_data\MET\10-Q_2025-05-01.md'


2025-11-14 17:15:24,933 - INFO - Going to convert document batch...
2025-11-14 17:15:24,934 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 17:15:30,196 - INFO - Finished converting document 10-Q_2025-08-07 in 8.41 sec.
2025-11-14 17:15:32,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\10-Q_2025-08-07' --> 'data\processed_data\MET\10-Q_2025-08-07.md'


2025-11-14 17:15:35,375 - INFO - Going to convert document batch...
2025-11-14 17:15:35,376 - INFO - Processing document 10-Q_2025-11-07
2025-11-14 17:15:40,901 - INFO - Finished converting document 10-Q_2025-11-07 in 8.69 sec.
2025-11-14 17:15:43,074 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:43,075 - ERROR - Input document 4_2023-01-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:15:43,076 - INFO - Going to convert document batch...
2025-11-14 17:15:43,09

Converted 'data\edgar_documents\MET\10-Q_2025-11-07' --> 'data\processed_data\MET\10-Q_2025-11-07.md'
Error processing data\edgar_documents\MET\4_2023-01-03: File format not allowed: data\edgar_documents\MET\4_2023-01-03
Converted 'data\edgar_documents\MET\4_2023-01-05' --> 'data\processed_data\MET\4_2023-01-05.md'
Converted 'data\edgar_documents\MET\4_2023-02-28' --> 'data\processed_data\MET\4_2023-02-28.md'


2025-11-14 17:15:43,252 - INFO - Going to convert document batch...
2025-11-14 17:15:43,252 - INFO - Processing document 4_2023-03-02
2025-11-14 17:15:43,271 - INFO - Finished converting document 4_2023-03-02 in 0.03 sec.
2025-11-14 17:15:43,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,311 - INFO - Going to convert document batch...
2025-11-14 17:15:43,314 - INFO - Processing document 4_2023-03-06
2025-11-14 17:15:43,335 - INFO - Finished converting document 4_2023-03-06 in 0.05 sec.
2025-11-14 17:15:43,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,387 - INFO - Going to convert document batch...
2025-11-14 17:15:43,388 - INFO - Processing document 4_2023-03-16
2025-11-14 17:15:43,408 - INFO - Finished converting document 4_2023-03-16 in 0.05 sec.
2025-11-14 17:15:43,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,449 - INFO - Going to convert document batch...
2025-11-14 17:15:43,449 - 

Converted 'data\edgar_documents\MET\4_2023-03-02' --> 'data\processed_data\MET\4_2023-03-02.md'
Converted 'data\edgar_documents\MET\4_2023-03-06' --> 'data\processed_data\MET\4_2023-03-06.md'
Converted 'data\edgar_documents\MET\4_2023-03-16' --> 'data\processed_data\MET\4_2023-03-16.md'


2025-11-14 17:15:43,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,512 - INFO - Going to convert document batch...
2025-11-14 17:15:43,513 - INFO - Processing document 4_2023-04-19
2025-11-14 17:15:43,533 - INFO - Finished converting document 4_2023-04-19 in 0.05 sec.
2025-11-14 17:15:43,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,596 - INFO - Going to convert document batch...
2025-11-14 17:15:43,598 - INFO - Processing document 4_2023-06-16
2025-11-14 17:15:43,620 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.
2025-11-14 17:15:43,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,665 - INFO - Going to convert document batch...
2025-11-14 17:15:43,665 - INFO - Processing document 4_2023-06-22


Converted 'data\edgar_documents\MET\4_2023-04-05' --> 'data\processed_data\MET\4_2023-04-05.md'
Converted 'data\edgar_documents\MET\4_2023-04-19' --> 'data\processed_data\MET\4_2023-04-19.md'
Converted 'data\edgar_documents\MET\4_2023-06-16' --> 'data\processed_data\MET\4_2023-06-16.md'


2025-11-14 17:15:43,683 - INFO - Finished converting document 4_2023-06-22 in 0.05 sec.
2025-11-14 17:15:43,726 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:43,727 - ERROR - Input document 4_2023-07-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:15:43,729 - INFO - Going to convert document batch...
2025-11-14 17:15:43,748 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:43,748 - ERROR - Input document 4_2023-07-11 with forma

Converted 'data\edgar_documents\MET\4_2023-06-22' --> 'data\processed_data\MET\4_2023-06-22.md'
Error processing data\edgar_documents\MET\4_2023-07-10: File format not allowed: data\edgar_documents\MET\4_2023-07-10
Error processing data\edgar_documents\MET\4_2023-07-11: File format not allowed: data\edgar_documents\MET\4_2023-07-11
Converted 'data\edgar_documents\MET\4_2023-08-11' --> 'data\processed_data\MET\4_2023-08-11.md'
Converted 'data\edgar_documents\MET\4_2023-09-05' --> 'data\processed_data\MET\4_2023-09-05.md'


2025-11-14 17:15:43,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,919 - INFO - Going to convert document batch...
2025-11-14 17:15:43,920 - INFO - Processing document 4_2023-09-18
2025-11-14 17:15:43,939 - INFO - Finished converting document 4_2023-09-18 in 0.06 sec.
2025-11-14 17:15:43,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:43,983 - INFO - Going to convert document batch...
2025-11-14 17:15:43,983 - INFO - Processing document 4_2023-10-04
2025-11-14 17:15:44,001 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 17:15:44,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,040 - INFO - Going to convert document batch...
2025-11-14 17:15:44,041 - INFO - Processing document 4_2023-12-18
2025-11-14 17:15:44,058 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 17:15:44,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MET\4_2023-09-18' --> 'data\processed_data\MET\4_2023-09-18.md'
Converted 'data\edgar_documents\MET\4_2023-10-04' --> 'data\processed_data\MET\4_2023-10-04.md'
Converted 'data\edgar_documents\MET\4_2023-12-18' --> 'data\processed_data\MET\4_2023-12-18.md'
Converted 'data\edgar_documents\MET\4_2024-01-04' --> 'data\processed_data\MET\4_2024-01-04.md'


2025-11-14 17:15:44,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,173 - INFO - Going to convert document batch...
2025-11-14 17:15:44,174 - INFO - Processing document 4_2024-02-07
2025-11-14 17:15:44,201 - INFO - Finished converting document 4_2024-02-07 in 0.08 sec.
2025-11-14 17:15:44,267 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:44,268 - ERROR - Input document 4_2024-02-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:15

Converted 'data\edgar_documents\MET\4_2024-02-07' --> 'data\processed_data\MET\4_2024-02-07.md'
Error processing data\edgar_documents\MET\4_2024-02-26: File format not allowed: data\edgar_documents\MET\4_2024-02-26
Converted 'data\edgar_documents\MET\4_2024-02-28' --> 'data\processed_data\MET\4_2024-02-28.md'
Converted 'data\edgar_documents\MET\4_2024-02-29' --> 'data\processed_data\MET\4_2024-02-29.md'
Error processing data\edgar_documents\MET\4_2024-03-04: File format not allowed: data\edgar_documents\MET\4_2024-03-04


2025-11-14 17:15:44,428 - INFO - Going to convert document batch...
2025-11-14 17:15:44,429 - INFO - Processing document 4_2024-03-05
2025-11-14 17:15:44,445 - INFO - Finished converting document 4_2024-03-05 in 0.03 sec.
2025-11-14 17:15:44,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,486 - INFO - Going to convert document batch...
2025-11-14 17:15:44,487 - INFO - Processing document 4_2024-03-14
2025-11-14 17:15:44,503 - INFO - Finished converting document 4_2024-03-14 in 0.03 sec.
2025-11-14 17:15:44,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,541 - INFO - Going to convert document batch...
2025-11-14 17:15:44,542 - INFO - Processing document 4_2024-03-18
2025-11-14 17:15:44,560 - INFO - Finished converting document 4_2024-03-18 in 0.05 sec.
2025-11-14 17:15:44,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,616 - INFO - Going to convert document batch...
2025-11-14 17:15:44,617 - 

Converted 'data\edgar_documents\MET\4_2024-03-05' --> 'data\processed_data\MET\4_2024-03-05.md'
Converted 'data\edgar_documents\MET\4_2024-03-14' --> 'data\processed_data\MET\4_2024-03-14.md'
Converted 'data\edgar_documents\MET\4_2024-03-18' --> 'data\processed_data\MET\4_2024-03-18.md'
Converted 'data\edgar_documents\MET\4_2024-03-20' --> 'data\processed_data\MET\4_2024-03-20.md'


2025-11-14 17:15:44,679 - INFO - Going to convert document batch...
2025-11-14 17:15:44,680 - INFO - Processing document 4_2024-04-03
2025-11-14 17:15:44,697 - INFO - Finished converting document 4_2024-04-03 in 0.03 sec.
2025-11-14 17:15:44,759 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:44,760 - ERROR - Input document 4_2024-06-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:15:44,761 - INFO - Going to convert document batch...
2025-11-14 17:15:44,791 - IN

Converted 'data\edgar_documents\MET\4_2024-04-03' --> 'data\processed_data\MET\4_2024-04-03.md'
Error processing data\edgar_documents\MET\4_2024-06-03: File format not allowed: data\edgar_documents\MET\4_2024-06-03
Error processing data\edgar_documents\MET\4_2024-06-04: File format not allowed: data\edgar_documents\MET\4_2024-06-04
Converted 'data\edgar_documents\MET\4_2024-06-13' --> 'data\processed_data\MET\4_2024-06-13.md'


2025-11-14 17:15:44,910 - INFO - Finished converting document 4_2024-06-20 in 0.03 sec.
2025-11-14 17:15:44,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:44,951 - INFO - Going to convert document batch...
2025-11-14 17:15:44,952 - INFO - Processing document 4_2024-08-05
2025-11-14 17:15:44,969 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 17:15:45,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,009 - INFO - Going to convert document batch...
2025-11-14 17:15:45,009 - INFO - Processing document 4_2024-09-12
2025-11-14 17:15:45,027 - INFO - Finished converting document 4_2024-09-12 in 0.05 sec.
2025-11-14 17:15:45,065 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:45,066 - ERROR - Input document 4_2024-09-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\MET\4_2024-06-20' --> 'data\processed_data\MET\4_2024-06-20.md'
Converted 'data\edgar_documents\MET\4_2024-08-05' --> 'data\processed_data\MET\4_2024-08-05.md'
Converted 'data\edgar_documents\MET\4_2024-09-12' --> 'data\processed_data\MET\4_2024-09-12.md'
Error processing data\edgar_documents\MET\4_2024-09-26: File format not allowed: data\edgar_documents\MET\4_2024-09-26
Error processing data\edgar_documents\MET\4_2024-09-27: File format not allowed: data\edgar_documents\MET\4_2024-09-27


2025-11-14 17:15:45,108 - INFO - Processing document 4_2024-10-03
2025-11-14 17:15:45,125 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 17:15:45,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,169 - INFO - Going to convert document batch...
2025-11-14 17:15:45,170 - INFO - Processing document 4_2024-12-17
2025-11-14 17:15:45,195 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 17:15:45,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,237 - INFO - Going to convert document batch...
2025-11-14 17:15:45,238 - INFO - Processing document 4_2024-12-18
2025-11-14 17:15:45,254 - INFO - Finished converting document 4_2024-12-18 in 0.03 sec.
2025-11-14 17:15:45,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,292 - INFO - Going to convert document batch...
2025-11-14 17:15:45,292 - INFO - Processing document 4_2025-01-06
2025-11-14 17:15:45,311 - IN

Converted 'data\edgar_documents\MET\4_2024-10-03' --> 'data\processed_data\MET\4_2024-10-03.md'
Converted 'data\edgar_documents\MET\4_2024-12-17' --> 'data\processed_data\MET\4_2024-12-17.md'
Converted 'data\edgar_documents\MET\4_2024-12-18' --> 'data\processed_data\MET\4_2024-12-18.md'
Converted 'data\edgar_documents\MET\4_2025-01-06' --> 'data\processed_data\MET\4_2025-01-06.md'


2025-11-14 17:15:45,348 - INFO - Going to convert document batch...
2025-11-14 17:15:45,348 - INFO - Processing document 4_2025-02-27
2025-11-14 17:15:45,374 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.
2025-11-14 17:15:45,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,415 - INFO - Going to convert document batch...
2025-11-14 17:15:45,416 - INFO - Processing document 4_2025-03-05
2025-11-14 17:15:45,433 - INFO - Finished converting document 4_2025-03-05 in 0.05 sec.
2025-11-14 17:15:45,475 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:15:45,476 - ERROR - Input document 4_2025-03-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\MET\4_2025-02-27' --> 'data\processed_data\MET\4_2025-02-27.md'
Converted 'data\edgar_documents\MET\4_2025-03-05' --> 'data\processed_data\MET\4_2025-03-05.md'
Error processing data\edgar_documents\MET\4_2025-03-11: File format not allowed: data\edgar_documents\MET\4_2025-03-11
Error processing data\edgar_documents\MET\4_2025-03-12: File format not allowed: data\edgar_documents\MET\4_2025-03-12
Converted 'data\edgar_documents\MET\4_2025-03-13' --> 'data\processed_data\MET\4_2025-03-13.md'


2025-11-14 17:15:45,576 - INFO - Processing document 4_2025-04-03
2025-11-14 17:15:45,592 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:15:45,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,648 - INFO - Going to convert document batch...
2025-11-14 17:15:45,650 - INFO - Processing document 4_2025-05-05
2025-11-14 17:15:45,680 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 17:15:45,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,718 - INFO - Going to convert document batch...
2025-11-14 17:15:45,719 - INFO - Processing document 4_2025-05-13
2025-11-14 17:15:45,737 - INFO - Finished converting document 4_2025-05-13 in 0.03 sec.
2025-11-14 17:15:45,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,790 - INFO - Going to convert document batch...
2025-11-14 17:15:45,790 - INFO - Processing document 4_2025-06-12
2025-11-14 17:15:45,807 - IN

Converted 'data\edgar_documents\MET\4_2025-04-03' --> 'data\processed_data\MET\4_2025-04-03.md'
Converted 'data\edgar_documents\MET\4_2025-05-05' --> 'data\processed_data\MET\4_2025-05-05.md'
Converted 'data\edgar_documents\MET\4_2025-05-13' --> 'data\processed_data\MET\4_2025-05-13.md'


2025-11-14 17:15:45,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,846 - INFO - Going to convert document batch...
2025-11-14 17:15:45,847 - INFO - Processing document 4_2025-06-20
2025-11-14 17:15:45,866 - INFO - Finished converting document 4_2025-06-20 in 0.03 sec.
2025-11-14 17:15:45,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,906 - INFO - Going to convert document batch...
2025-11-14 17:15:45,907 - INFO - Processing document 4_2025-09-11
2025-11-14 17:15:45,943 - INFO - Finished converting document 4_2025-09-11 in 0.05 sec.
2025-11-14 17:15:45,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:45,994 - INFO - Going to convert document batch...
2025-11-14 17:15:45,995 - INFO - Processing document 4_2025-10-03
2025-11-14 17:15:46,013 - INFO - Finished converting document 4_2025-10-03 in 0.05 sec.


Converted 'data\edgar_documents\MET\4_2025-06-12' --> 'data\processed_data\MET\4_2025-06-12.md'
Converted 'data\edgar_documents\MET\4_2025-06-20' --> 'data\processed_data\MET\4_2025-06-20.md'
Converted 'data\edgar_documents\MET\4_2025-09-11' --> 'data\processed_data\MET\4_2025-09-11.md'


2025-11-14 17:15:46,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,057 - INFO - Going to convert document batch...
2025-11-14 17:15:46,057 - INFO - Processing document 4_2025-11-04
2025-11-14 17:15:46,078 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 17:15:46,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,127 - INFO - Going to convert document batch...
2025-11-14 17:15:46,128 - INFO - Processing document 8-K_2023-01-06
2025-11-14 17:15:46,153 - INFO - Finished converting document 8-K_2023-01-06 in 0.06 sec.
2025-11-14 17:15:46,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,189 - INFO - Going to convert document batch...
2025-11-14 17:15:46,190 - INFO - Processing document 8-K_2023-01-11
2025-11-14 17:15:46,207 - INFO - Finished converting document 8-K_2023-01-11 in 0.03 sec.


Converted 'data\edgar_documents\MET\4_2025-10-03' --> 'data\processed_data\MET\4_2025-10-03.md'
Converted 'data\edgar_documents\MET\4_2025-11-04' --> 'data\processed_data\MET\4_2025-11-04.md'
Converted 'data\edgar_documents\MET\8-K_2023-01-06' --> 'data\processed_data\MET\8-K_2023-01-06.md'


2025-11-14 17:15:46,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,244 - INFO - Going to convert document batch...
2025-11-14 17:15:46,245 - INFO - Processing document 8-K_2023-02-01
2025-11-14 17:15:46,268 - INFO - Finished converting document 8-K_2023-02-01 in 0.05 sec.
2025-11-14 17:15:46,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,326 - INFO - Going to convert document batch...
2025-11-14 17:15:46,327 - INFO - Processing document 8-K_2023-02-07
2025-11-14 17:15:46,348 - INFO - Finished converting document 8-K_2023-02-07 in 0.06 sec.
2025-11-14 17:15:46,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,385 - INFO - Going to convert document batch...
2025-11-14 17:15:46,386 - INFO - Processing document 8-K_2023-02-15
2025-11-14 17:15:46,403 - INFO - Finished converting document 8-K_2023-02-15 in 0.05 sec.


Converted 'data\edgar_documents\MET\8-K_2023-01-11' --> 'data\processed_data\MET\8-K_2023-01-11.md'
Converted 'data\edgar_documents\MET\8-K_2023-02-01' --> 'data\processed_data\MET\8-K_2023-02-01.md'
Converted 'data\edgar_documents\MET\8-K_2023-02-07' --> 'data\processed_data\MET\8-K_2023-02-07.md'


2025-11-14 17:15:46,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,436 - INFO - Going to convert document batch...
2025-11-14 17:15:46,436 - INFO - Processing document 8-K_2023-03-01
2025-11-14 17:15:46,452 - INFO - Finished converting document 8-K_2023-03-01 in 0.05 sec.
2025-11-14 17:15:46,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,484 - INFO - Going to convert document batch...
2025-11-14 17:15:46,485 - INFO - Processing document 8-K_2023-03-06
2025-11-14 17:15:46,503 - INFO - Finished converting document 8-K_2023-03-06 in 0.05 sec.
2025-11-14 17:15:46,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,543 - INFO - Going to convert document batch...
2025-11-14 17:15:46,545 - INFO - Processing document 8-K_2023-04-17
2025-11-14 17:15:46,579 - INFO - Finished converting document 8-K_2023-04-17 in 0.06 sec.


Converted 'data\edgar_documents\MET\8-K_2023-02-15' --> 'data\processed_data\MET\8-K_2023-02-15.md'
Converted 'data\edgar_documents\MET\8-K_2023-03-01' --> 'data\processed_data\MET\8-K_2023-03-01.md'
Converted 'data\edgar_documents\MET\8-K_2023-03-06' --> 'data\processed_data\MET\8-K_2023-03-06.md'


2025-11-14 17:15:46,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,624 - INFO - Going to convert document batch...
2025-11-14 17:15:46,626 - INFO - Processing document 8-K_2023-05-03
2025-11-14 17:15:46,650 - INFO - Finished converting document 8-K_2023-05-03 in 0.05 sec.
2025-11-14 17:15:46,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,693 - INFO - Going to convert document batch...
2025-11-14 17:15:46,693 - INFO - Processing document 8-K_2023-05-09
2025-11-14 17:15:46,711 - INFO - Finished converting document 8-K_2023-05-09 in 0.03 sec.
2025-11-14 17:15:46,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,742 - INFO - Going to convert document batch...
2025-11-14 17:15:46,743 - INFO - Processing document 8-K_2023-05-15
2025-11-14 17:15:46,759 - INFO - Finished converting document 8-K_2023-05-15 in 0.03 sec.
2025-11-14 17:15:46,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\8-K_2023-04-17' --> 'data\processed_data\MET\8-K_2023-04-17.md'
Converted 'data\edgar_documents\MET\8-K_2023-05-03' --> 'data\processed_data\MET\8-K_2023-05-03.md'
Converted 'data\edgar_documents\MET\8-K_2023-05-09' --> 'data\processed_data\MET\8-K_2023-05-09.md'
Converted 'data\edgar_documents\MET\8-K_2023-05-15' --> 'data\processed_data\MET\8-K_2023-05-15.md'


2025-11-14 17:15:46,794 - INFO - Going to convert document batch...
2025-11-14 17:15:46,795 - INFO - Processing document 8-K_2023-05-25
2025-11-14 17:15:46,813 - INFO - Finished converting document 8-K_2023-05-25 in 0.05 sec.
2025-11-14 17:15:46,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,849 - INFO - Going to convert document batch...
2025-11-14 17:15:46,850 - INFO - Processing document 8-K_2023-06-21
2025-11-14 17:15:46,865 - INFO - Finished converting document 8-K_2023-06-21 in 0.03 sec.
2025-11-14 17:15:46,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:46,908 - INFO - Going to convert document batch...
2025-11-14 17:15:46,909 - INFO - Processing document 8-K_2023-06-23
2025-11-14 17:15:46,943 - INFO - Finished converting document 8-K_2023-06-23 in 0.06 sec.
2025-11-14 17:15:46,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,007 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2023-05-25' --> 'data\processed_data\MET\8-K_2023-05-25.md'
Converted 'data\edgar_documents\MET\8-K_2023-06-21' --> 'data\processed_data\MET\8-K_2023-06-21.md'
Converted 'data\edgar_documents\MET\8-K_2023-06-23' --> 'data\processed_data\MET\8-K_2023-06-23.md'


2025-11-14 17:15:47,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,066 - INFO - Going to convert document batch...
2025-11-14 17:15:47,067 - INFO - Processing document 8-K_2023-08-02
2025-11-14 17:15:47,091 - INFO - Finished converting document 8-K_2023-08-02 in 0.05 sec.
2025-11-14 17:15:47,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,131 - INFO - Going to convert document batch...
2025-11-14 17:15:47,132 - INFO - Processing document 8-K_2023-08-15
2025-11-14 17:15:47,150 - INFO - Finished converting document 8-K_2023-08-15 in 0.03 sec.
2025-11-14 17:15:47,198 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,211 - INFO - Going to convert document batch...
2025-11-14 17:15:47,212 - INFO - Processing document 8-K_2023-10-05
2025-11-14 17:15:47,237 - INFO - Finished converting document 8-K_2023-10-05 in 0.08 sec.


Converted 'data\edgar_documents\MET\8-K_2023-07-12' --> 'data\processed_data\MET\8-K_2023-07-12.md'
Converted 'data\edgar_documents\MET\8-K_2023-08-02' --> 'data\processed_data\MET\8-K_2023-08-02.md'
Converted 'data\edgar_documents\MET\8-K_2023-08-15' --> 'data\processed_data\MET\8-K_2023-08-15.md'


2025-11-14 17:15:47,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,276 - INFO - Going to convert document batch...
2025-11-14 17:15:47,277 - INFO - Processing document 8-K_2023-11-01
2025-11-14 17:15:47,299 - INFO - Finished converting document 8-K_2023-11-01 in 0.05 sec.
2025-11-14 17:15:47,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,363 - INFO - Going to convert document batch...
2025-11-14 17:15:47,364 - INFO - Processing document 8-K_2023-11-15
2025-11-14 17:15:47,380 - INFO - Finished converting document 8-K_2023-11-15 in 0.06 sec.
2025-11-14 17:15:47,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,413 - INFO - Going to convert document batch...
2025-11-14 17:15:47,415 - INFO - Processing document 8-K_2023-11-16
2025-11-14 17:15:47,430 - INFO - Finished converting document 8-K_2023-11-16 in 0.03 sec.
2025-11-14 17:15:47,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\8-K_2023-10-05' --> 'data\processed_data\MET\8-K_2023-10-05.md'
Converted 'data\edgar_documents\MET\8-K_2023-11-01' --> 'data\processed_data\MET\8-K_2023-11-01.md'
Converted 'data\edgar_documents\MET\8-K_2023-11-15' --> 'data\processed_data\MET\8-K_2023-11-15.md'
Converted 'data\edgar_documents\MET\8-K_2023-11-16' --> 'data\processed_data\MET\8-K_2023-11-16.md'


2025-11-14 17:15:47,463 - INFO - Going to convert document batch...
2025-11-14 17:15:47,464 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:15:47,492 - INFO - Finished converting document 8-K_2024-01-31 in 0.05 sec.
2025-11-14 17:15:47,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,532 - INFO - Going to convert document batch...
2025-11-14 17:15:47,533 - INFO - Processing document 8-K_2024-02-15
2025-11-14 17:15:47,552 - INFO - Finished converting document 8-K_2024-02-15 in 0.05 sec.
2025-11-14 17:15:47,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,609 - INFO - Going to convert document batch...
2025-11-14 17:15:47,610 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:15:47,625 - INFO - Finished converting document 8-K_2024-02-28 in 0.06 sec.
2025-11-14 17:15:47,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,675 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2024-01-31' --> 'data\processed_data\MET\8-K_2024-01-31.md'
Converted 'data\edgar_documents\MET\8-K_2024-02-15' --> 'data\processed_data\MET\8-K_2024-02-15.md'
Converted 'data\edgar_documents\MET\8-K_2024-02-28' --> 'data\processed_data\MET\8-K_2024-02-28.md'


2025-11-14 17:15:47,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,731 - INFO - Going to convert document batch...
2025-11-14 17:15:47,732 - INFO - Processing document 8-K_2024-03-07
2025-11-14 17:15:47,766 - INFO - Finished converting document 8-K_2024-03-07 in 0.06 sec.
2025-11-14 17:15:47,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,830 - INFO - Going to convert document batch...
2025-11-14 17:15:47,831 - INFO - Processing document 8-K_2024-03-12
2025-11-14 17:15:47,849 - INFO - Finished converting document 8-K_2024-03-12 in 0.06 sec.
2025-11-14 17:15:47,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\8-K_2024-03-05' --> 'data\processed_data\MET\8-K_2024-03-05.md'
Converted 'data\edgar_documents\MET\8-K_2024-03-07' --> 'data\processed_data\MET\8-K_2024-03-07.md'
Converted 'data\edgar_documents\MET\8-K_2024-03-12' --> 'data\processed_data\MET\8-K_2024-03-12.md'


2025-11-14 17:15:47,913 - INFO - Going to convert document batch...
2025-11-14 17:15:47,914 - INFO - Processing document 8-K_2024-05-01
2025-11-14 17:15:47,948 - INFO - Finished converting document 8-K_2024-05-01 in 0.09 sec.
2025-11-14 17:15:47,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:47,990 - INFO - Going to convert document batch...
2025-11-14 17:15:47,991 - INFO - Processing document 8-K_2024-05-15
2025-11-14 17:15:48,008 - INFO - Finished converting document 8-K_2024-05-15 in 0.03 sec.
2025-11-14 17:15:48,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,045 - INFO - Going to convert document batch...
2025-11-14 17:15:48,045 - INFO - Processing document 8-K_2024-06-05
2025-11-14 17:15:48,067 - INFO - Finished converting document 8-K_2024-06-05 in 0.05 sec.
2025-11-14 17:15:48,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,107 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2024-05-01' --> 'data\processed_data\MET\8-K_2024-05-01.md'
Converted 'data\edgar_documents\MET\8-K_2024-05-15' --> 'data\processed_data\MET\8-K_2024-05-15.md'
Converted 'data\edgar_documents\MET\8-K_2024-06-05' --> 'data\processed_data\MET\8-K_2024-06-05.md'


2025-11-14 17:15:48,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,176 - INFO - Going to convert document batch...
2025-11-14 17:15:48,177 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:15:48,222 - INFO - Finished converting document 8-K_2024-07-31 in 0.06 sec.
2025-11-14 17:15:48,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,286 - INFO - Going to convert document batch...
2025-11-14 17:15:48,287 - INFO - Processing document 8-K_2024-08-15
2025-11-14 17:15:48,304 - INFO - Finished converting document 8-K_2024-08-15 in 0.05 sec.
2025-11-14 17:15:48,329 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,342 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MET\8-K_2024-06-24' --> 'data\processed_data\MET\8-K_2024-06-24.md'
Converted 'data\edgar_documents\MET\8-K_2024-07-31' --> 'data\processed_data\MET\8-K_2024-07-31.md'
Converted 'data\edgar_documents\MET\8-K_2024-08-15' --> 'data\processed_data\MET\8-K_2024-08-15.md'


2025-11-14 17:15:48,343 - INFO - Processing document 8-K_2024-09-30
2025-11-14 17:15:48,367 - INFO - Finished converting document 8-K_2024-09-30 in 0.05 sec.
2025-11-14 17:15:48,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,407 - INFO - Going to convert document batch...
2025-11-14 17:15:48,409 - INFO - Processing document 8-K_2024-10-30
2025-11-14 17:15:48,431 - INFO - Finished converting document 8-K_2024-10-30 in 0.05 sec.
2025-11-14 17:15:48,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,465 - INFO - Going to convert document batch...
2025-11-14 17:15:48,466 - INFO - Processing document 8-K_2024-11-15
2025-11-14 17:15:48,482 - INFO - Finished converting document 8-K_2024-11-15 in 0.05 sec.
2025-11-14 17:15:48,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,514 - INFO - Going to convert document batch...
2025-11-14 17:15:48,515 - INFO - Processing document 8-K_2024-12-11
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2024-09-30' --> 'data\processed_data\MET\8-K_2024-09-30.md'
Converted 'data\edgar_documents\MET\8-K_2024-10-30' --> 'data\processed_data\MET\8-K_2024-10-30.md'
Converted 'data\edgar_documents\MET\8-K_2024-11-15' --> 'data\processed_data\MET\8-K_2024-11-15.md'
Converted 'data\edgar_documents\MET\8-K_2024-12-11' --> 'data\processed_data\MET\8-K_2024-12-11.md'


2025-11-14 17:15:48,560 - INFO - Processing document 8-K_2024-12-12
2025-11-14 17:15:48,579 - INFO - Finished converting document 8-K_2024-12-12 in 0.05 sec.
2025-11-14 17:15:48,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,618 - INFO - Going to convert document batch...
2025-11-14 17:15:48,619 - INFO - Processing document 8-K_2025-01-10
2025-11-14 17:15:48,634 - INFO - Finished converting document 8-K_2025-01-10 in 0.03 sec.
2025-11-14 17:15:48,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,668 - INFO - Going to convert document batch...
2025-11-14 17:15:48,668 - INFO - Processing document 8-K_2025-02-05
2025-11-14 17:15:48,701 - INFO - Finished converting document 8-K_2025-02-05 in 0.06 sec.
2025-11-14 17:15:48,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,753 - INFO - Going to convert document batch...
2025-11-14 17:15:48,754 - INFO - Processing document 8-K_2025-02-18
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2024-12-12' --> 'data\processed_data\MET\8-K_2024-12-12.md'
Converted 'data\edgar_documents\MET\8-K_2025-01-10' --> 'data\processed_data\MET\8-K_2025-01-10.md'
Converted 'data\edgar_documents\MET\8-K_2025-02-05' --> 'data\processed_data\MET\8-K_2025-02-05.md'


2025-11-14 17:15:48,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,805 - INFO - Going to convert document batch...
2025-11-14 17:15:48,806 - INFO - Processing document 8-K_2025-02-27
2025-11-14 17:15:48,820 - INFO - Finished converting document 8-K_2025-02-27 in 0.03 sec.
2025-11-14 17:15:48,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,856 - INFO - Going to convert document batch...
2025-11-14 17:15:48,858 - INFO - Processing document 8-K_2025-03-04
2025-11-14 17:15:48,874 - INFO - Finished converting document 8-K_2025-03-04 in 0.05 sec.
2025-11-14 17:15:48,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:48,903 - INFO - Going to convert document batch...
2025-11-14 17:15:48,904 - INFO - Processing document 8-K_2025-03-05
2025-11-14 17:15:48,920 - INFO - Finished converting document 8-K_2025-03-05 in 0.05 sec.
2025-11-14 17:15:48,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\MET\8-K_2025-02-18' --> 'data\processed_data\MET\8-K_2025-02-18.md'
Converted 'data\edgar_documents\MET\8-K_2025-02-27' --> 'data\processed_data\MET\8-K_2025-02-27.md'
Converted 'data\edgar_documents\MET\8-K_2025-03-04' --> 'data\processed_data\MET\8-K_2025-03-04.md'
Converted 'data\edgar_documents\MET\8-K_2025-03-05' --> 'data\processed_data\MET\8-K_2025-03-05.md'


2025-11-14 17:15:49,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,029 - INFO - Going to convert document batch...
2025-11-14 17:15:49,030 - INFO - Processing document 8-K_2025-03-28
2025-11-14 17:15:49,049 - INFO - Finished converting document 8-K_2025-03-28 in 0.05 sec.
2025-11-14 17:15:49,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,083 - INFO - Going to convert document batch...
2025-11-14 17:15:49,084 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:15:49,102 - INFO - Finished converting document 8-K_2025-04-30 in 0.03 sec.
2025-11-14 17:15:49,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,136 - INFO - Going to convert document batch...
2025-11-14 17:15:49,137 - INFO - Processing document 8-K_2025-05-15
2025-11-14 17:15:49,154 - INFO - Finished converting document 8-K_2025-05-15 in 0.05 sec.
2025-11-14 17:15:49,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\MET\8-K_2025-03-13' --> 'data\processed_data\MET\8-K_2025-03-13.md'
Converted 'data\edgar_documents\MET\8-K_2025-03-28' --> 'data\processed_data\MET\8-K_2025-03-28.md'
Converted 'data\edgar_documents\MET\8-K_2025-04-30' --> 'data\processed_data\MET\8-K_2025-04-30.md'
Converted 'data\edgar_documents\MET\8-K_2025-05-15' --> 'data\processed_data\MET\8-K_2025-05-15.md'


2025-11-14 17:15:49,186 - INFO - Processing document 8-K_2025-06-17
2025-11-14 17:15:49,202 - INFO - Finished converting document 8-K_2025-06-17 in 0.05 sec.
2025-11-14 17:15:49,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,240 - INFO - Going to convert document batch...
2025-11-14 17:15:49,241 - INFO - Processing document 8-K_2025-06-20
2025-11-14 17:15:49,264 - INFO - Finished converting document 8-K_2025-06-20 in 0.06 sec.
2025-11-14 17:15:49,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,300 - INFO - Going to convert document batch...
2025-11-14 17:15:49,301 - INFO - Processing document 8-K_2025-06-23
2025-11-14 17:15:49,316 - INFO - Finished converting document 8-K_2025-06-23 in 0.03 sec.
2025-11-14 17:15:49,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,377 - INFO - Going to convert document batch...
2025-11-14 17:15:49,377 - INFO - Processing document 8-K_2025-07-01


Converted 'data\edgar_documents\MET\8-K_2025-06-17' --> 'data\processed_data\MET\8-K_2025-06-17.md'
Converted 'data\edgar_documents\MET\8-K_2025-06-20' --> 'data\processed_data\MET\8-K_2025-06-20.md'
Converted 'data\edgar_documents\MET\8-K_2025-06-23' --> 'data\processed_data\MET\8-K_2025-06-23.md'


2025-11-14 17:15:49,395 - INFO - Finished converting document 8-K_2025-07-01 in 0.06 sec.
2025-11-14 17:15:49,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,431 - INFO - Going to convert document batch...
2025-11-14 17:15:49,432 - INFO - Processing document 8-K_2025-07-30
2025-11-14 17:15:49,449 - INFO - Finished converting document 8-K_2025-07-30 in 0.05 sec.
2025-11-14 17:15:49,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,482 - INFO - Going to convert document batch...
2025-11-14 17:15:49,482 - INFO - Processing document 8-K_2025-08-06
2025-11-14 17:15:49,505 - INFO - Finished converting document 8-K_2025-08-06 in 0.05 sec.
2025-11-14 17:15:49,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,543 - INFO - Going to convert document batch...
2025-11-14 17:15:49,543 - INFO - Processing document 8-K_2025-08-15
2025-11-14 17:15:49,560 - INFO - Finished converting document 8-K_2025-08-15 in 0.

Converted 'data\edgar_documents\MET\8-K_2025-07-01' --> 'data\processed_data\MET\8-K_2025-07-01.md'
Converted 'data\edgar_documents\MET\8-K_2025-07-30' --> 'data\processed_data\MET\8-K_2025-07-30.md'
Converted 'data\edgar_documents\MET\8-K_2025-08-06' --> 'data\processed_data\MET\8-K_2025-08-06.md'
Converted 'data\edgar_documents\MET\8-K_2025-08-15' --> 'data\processed_data\MET\8-K_2025-08-15.md'


2025-11-14 17:15:49,595 - INFO - Processing document 8-K_2025-09-02
2025-11-14 17:15:49,610 - INFO - Finished converting document 8-K_2025-09-02 in 0.05 sec.
2025-11-14 17:15:49,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,642 - INFO - Going to convert document batch...
2025-11-14 17:15:49,643 - INFO - Processing document 8-K_2025-09-15
2025-11-14 17:15:49,663 - INFO - Finished converting document 8-K_2025-09-15 in 0.05 sec.
2025-11-14 17:15:49,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,695 - INFO - Going to convert document batch...
2025-11-14 17:15:49,696 - INFO - Processing document 8-K_2025-09-22
2025-11-14 17:15:49,710 - INFO - Finished converting document 8-K_2025-09-22 in 0.03 sec.
2025-11-14 17:15:49,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:15:49,742 - INFO - Going to convert document batch...
2025-11-14 17:15:49,743 - INFO - Processing document 8-K_2025-10-14
2025-11-14 17:

Converted 'data\edgar_documents\MET\8-K_2025-09-02' --> 'data\processed_data\MET\8-K_2025-09-02.md'
Converted 'data\edgar_documents\MET\8-K_2025-09-15' --> 'data\processed_data\MET\8-K_2025-09-15.md'
Converted 'data\edgar_documents\MET\8-K_2025-09-22' --> 'data\processed_data\MET\8-K_2025-09-22.md'
Converted 'data\edgar_documents\MET\8-K_2025-10-14' --> 'data\processed_data\MET\8-K_2025-10-14.md'


2025-11-14 17:15:49,795 - INFO - Processing document 8-K_2025-11-05
2025-11-14 17:15:49,816 - INFO - Finished converting document 8-K_2025-11-05 in 0.05 sec.
2025-11-14 17:15:49,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\8-K_2025-11-05' --> 'data\processed_data\MET\8-K_2025-11-05.md'


2025-11-14 17:15:51,544 - INFO - Going to convert document batch...
2025-11-14 17:15:51,546 - INFO - Processing document DEF-14A_2023-04-28
2025-11-14 17:15:54,406 - INFO - Finished converting document DEF-14A_2023-04-28 in 4.58 sec.
2025-11-14 17:15:55,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\DEF-14A_2023-04-28' --> 'data\processed_data\MET\DEF-14A_2023-04-28.md'


2025-11-14 17:15:56,553 - INFO - Going to convert document batch...
2025-11-14 17:15:56,554 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 17:16:00,923 - INFO - Finished converting document DEF-14A_2024-04-26 in 5.53 sec.
2025-11-14 17:16:02,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\DEF-14A_2024-04-26' --> 'data\processed_data\MET\DEF-14A_2024-04-26.md'


2025-11-14 17:16:03,487 - INFO - Going to convert document batch...
2025-11-14 17:16:03,488 - INFO - Processing document DEF-14A_2025-04-29
2025-11-14 17:16:10,688 - INFO - Finished converting document DEF-14A_2025-04-29 in 8.41 sec.
2025-11-14 17:16:12,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MET\DEF-14A_2025-04-29' --> 'data\processed_data\MET\DEF-14A_2025-04-29.md'
Processed 117 new files. Errors: 11
Found 366 files to process in data\edgar_documents\META


2025-11-14 17:16:13,430 - INFO - Going to convert document batch...
2025-11-14 17:16:13,431 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:16:13,431 - INFO - Processing document 10-K_2023-02-02
2025-11-14 17:16:15,217 - INFO - Finished converting document 10-K_2023-02-02 in 2.42 sec.
2025-11-14 17:16:15,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-K_2023-02-02' --> 'data\processed_data\META\10-K_2023-02-02.md'


2025-11-14 17:16:16,697 - INFO - Going to convert document batch...
2025-11-14 17:16:16,698 - INFO - Processing document 10-K_2024-02-02
2025-11-14 17:16:18,506 - INFO - Finished converting document 10-K_2024-02-02 in 2.80 sec.
2025-11-14 17:16:19,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-K_2024-02-02' --> 'data\processed_data\META\10-K_2024-02-02.md'


2025-11-14 17:16:19,875 - INFO - Going to convert document batch...
2025-11-14 17:16:19,876 - INFO - Processing document 10-K_2025-01-30
2025-11-14 17:16:21,470 - INFO - Finished converting document 10-K_2025-01-30 in 2.44 sec.
2025-11-14 17:16:21,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-K_2025-01-30' --> 'data\processed_data\META\10-K_2025-01-30.md'


2025-11-14 17:16:22,324 - INFO - Going to convert document batch...
2025-11-14 17:16:22,325 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:16:23,061 - INFO - Finished converting document 10-Q_2023-04-27 in 1.14 sec.
2025-11-14 17:16:23,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2023-04-27' --> 'data\processed_data\META\10-Q_2023-04-27.md'


2025-11-14 17:16:24,327 - INFO - Going to convert document batch...
2025-11-14 17:16:24,329 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:16:25,100 - INFO - Finished converting document 10-Q_2023-07-27 in 1.67 sec.
2025-11-14 17:16:25,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2023-07-27' --> 'data\processed_data\META\10-Q_2023-07-27.md'


2025-11-14 17:16:26,249 - INFO - Going to convert document batch...
2025-11-14 17:16:26,250 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:16:27,028 - INFO - Finished converting document 10-Q_2023-10-26 in 1.56 sec.
2025-11-14 17:16:27,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2023-10-26' --> 'data\processed_data\META\10-Q_2023-10-26.md'


2025-11-14 17:16:27,751 - INFO - Going to convert document batch...
2025-11-14 17:16:27,752 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 17:16:28,395 - INFO - Finished converting document 10-Q_2024-04-25 in 0.97 sec.
2025-11-14 17:16:28,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2024-04-25' --> 'data\processed_data\META\10-Q_2024-04-25.md'


2025-11-14 17:16:29,467 - INFO - Going to convert document batch...
2025-11-14 17:16:29,468 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 17:16:30,153 - INFO - Finished converting document 10-Q_2024-08-01 in 1.45 sec.
2025-11-14 17:16:30,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2024-08-01' --> 'data\processed_data\META\10-Q_2024-08-01.md'


2025-11-14 17:16:30,887 - INFO - Going to convert document batch...
2025-11-14 17:16:30,888 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 17:16:31,623 - INFO - Finished converting document 10-Q_2024-10-31 in 1.12 sec.
2025-11-14 17:16:32,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2024-10-31' --> 'data\processed_data\META\10-Q_2024-10-31.md'


2025-11-14 17:16:32,663 - INFO - Going to convert document batch...
2025-11-14 17:16:32,664 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 17:16:33,234 - INFO - Finished converting document 10-Q_2025-05-01 in 0.89 sec.
2025-11-14 17:16:33,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2025-05-01' --> 'data\processed_data\META\10-Q_2025-05-01.md'


2025-11-14 17:16:33,924 - INFO - Going to convert document batch...
2025-11-14 17:16:33,925 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 17:16:34,945 - INFO - Finished converting document 10-Q_2025-07-31 in 1.39 sec.
2025-11-14 17:16:35,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\10-Q_2025-07-31' --> 'data\processed_data\META\10-Q_2025-07-31.md'


2025-11-14 17:16:35,748 - INFO - Going to convert document batch...
2025-11-14 17:16:35,749 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 17:16:36,422 - INFO - Finished converting document 10-Q_2025-10-30 in 1.14 sec.
2025-11-14 17:16:36,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:36,792 - INFO - Going to convert document batch...
2025-11-14 17:16:36,793 - INFO - Processing document 4_2023-01-06
2025-11-14 17:16:36,811 - INFO - Finished converting document 4_2023-01-06 in 0.05 sec.
2025-11-14 17:16:36,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:36,852 - INFO - Going to convert document batch...
2025-11-14 17:16:36,852 - INFO - Processing document 4_2023-01-11
2025-11-14 17:16:36,870 - INFO - Finished converting document 4_2023-01-11 in 0.05 sec.
2025-11-14 17:16:36,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:36,930 - INFO - Going to convert document batch...
2025-11-14 17:16:36,

Converted 'data\edgar_documents\META\10-Q_2025-10-30' --> 'data\processed_data\META\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\META\4_2023-01-06' --> 'data\processed_data\META\4_2023-01-06.md'
Converted 'data\edgar_documents\META\4_2023-01-11' --> 'data\processed_data\META\4_2023-01-11.md'


2025-11-14 17:16:36,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:36,999 - INFO - Going to convert document batch...
2025-11-14 17:16:37,000 - INFO - Processing document 4_2023-01-27
2025-11-14 17:16:37,034 - INFO - Finished converting document 4_2023-01-27 in 0.06 sec.
2025-11-14 17:16:37,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,093 - INFO - Going to convert document batch...
2025-11-14 17:16:37,094 - INFO - Processing document 4_2023-02-03
2025-11-14 17:16:37,113 - INFO - Finished converting document 4_2023-02-03 in 0.05 sec.
2025-11-14 17:16:37,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,148 - INFO - Going to convert document batch...
2025-11-14 17:16:37,149 - INFO - Processing document 4_2023-02-09


Converted 'data\edgar_documents\META\4_2023-01-20' --> 'data\processed_data\META\4_2023-01-20.md'
Converted 'data\edgar_documents\META\4_2023-01-27' --> 'data\processed_data\META\4_2023-01-27.md'
Converted 'data\edgar_documents\META\4_2023-02-03' --> 'data\processed_data\META\4_2023-02-03.md'


2025-11-14 17:16:37,166 - INFO - Finished converting document 4_2023-02-09 in 0.05 sec.
2025-11-14 17:16:37,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,205 - INFO - Going to convert document batch...
2025-11-14 17:16:37,206 - INFO - Processing document 4_2023-02-10
2025-11-14 17:16:37,226 - INFO - Finished converting document 4_2023-02-10 in 0.03 sec.
2025-11-14 17:16:37,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,265 - INFO - Going to convert document batch...
2025-11-14 17:16:37,265 - INFO - Processing document 4_2023-02-17
2025-11-14 17:16:37,285 - INFO - Finished converting document 4_2023-02-17 in 0.03 sec.
2025-11-14 17:16:37,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,325 - INFO - Going to convert document batch...
2025-11-14 17:16:37,325 - INFO - Processing document 4_2023-02-21
2025-11-14 17:16:37,345 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.


Converted 'data\edgar_documents\META\4_2023-02-09' --> 'data\processed_data\META\4_2023-02-09.md'
Converted 'data\edgar_documents\META\4_2023-02-10' --> 'data\processed_data\META\4_2023-02-10.md'
Converted 'data\edgar_documents\META\4_2023-02-17' --> 'data\processed_data\META\4_2023-02-17.md'
Converted 'data\edgar_documents\META\4_2023-02-21' --> 'data\processed_data\META\4_2023-02-21.md'


2025-11-14 17:16:37,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,409 - INFO - Going to convert document batch...
2025-11-14 17:16:37,410 - INFO - Processing document 4_2023-02-22
2025-11-14 17:16:37,434 - INFO - Finished converting document 4_2023-02-22 in 0.08 sec.
2025-11-14 17:16:37,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,478 - INFO - Going to convert document batch...
2025-11-14 17:16:37,480 - INFO - Processing document 4_2023-03-02
2025-11-14 17:16:37,497 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 17:16:37,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,537 - INFO - Going to convert document batch...
2025-11-14 17:16:37,538 - INFO - Processing document 4_2023-03-09
2025-11-14 17:16:37,554 - INFO - Finished converting document 4_2023-03-09 in 0.03 sec.
2025-11-14 17:16:37,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2023-02-22' --> 'data\processed_data\META\4_2023-02-22.md'
Converted 'data\edgar_documents\META\4_2023-03-02' --> 'data\processed_data\META\4_2023-03-02.md'
Converted 'data\edgar_documents\META\4_2023-03-09' --> 'data\processed_data\META\4_2023-03-09.md'
Converted 'data\edgar_documents\META\4_2023-03-16' --> 'data\processed_data\META\4_2023-03-16.md'


2025-11-14 17:16:37,648 - INFO - Going to convert document batch...
2025-11-14 17:16:37,649 - INFO - Processing document 4_2023-03-22
2025-11-14 17:16:37,668 - INFO - Finished converting document 4_2023-03-22 in 0.05 sec.
2025-11-14 17:16:37,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,734 - INFO - Going to convert document batch...
2025-11-14 17:16:37,735 - INFO - Processing document 4_2023-03-29
2025-11-14 17:16:37,759 - INFO - Finished converting document 4_2023-03-29 in 0.05 sec.
2025-11-14 17:16:37,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,802 - INFO - Going to convert document batch...
2025-11-14 17:16:37,803 - INFO - Processing document 4_2023-04-06
2025-11-14 17:16:37,830 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 17:16:37,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,870 - INFO - Going to convert document batch...
2025-11-14 17:16:37,871 - 

Converted 'data\edgar_documents\META\4_2023-03-22' --> 'data\processed_data\META\4_2023-03-22.md'
Converted 'data\edgar_documents\META\4_2023-03-29' --> 'data\processed_data\META\4_2023-03-29.md'
Converted 'data\edgar_documents\META\4_2023-04-06' --> 'data\processed_data\META\4_2023-04-06.md'


2025-11-14 17:16:37,889 - INFO - Finished converting document 4_2023-04-12 in 0.05 sec.
2025-11-14 17:16:37,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,935 - INFO - Going to convert document batch...
2025-11-14 17:16:37,935 - INFO - Processing document 4_2023-04-20
2025-11-14 17:16:37,954 - INFO - Finished converting document 4_2023-04-20 in 0.05 sec.
2025-11-14 17:16:37,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:37,999 - INFO - Going to convert document batch...
2025-11-14 17:16:37,999 - INFO - Processing document 4_2023-04-27
2025-11-14 17:16:38,016 - INFO - Finished converting document 4_2023-04-27 in 0.03 sec.
2025-11-14 17:16:38,062 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:16:38,063 - ERROR - Input document 4_2023-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\META\4_2023-04-12' --> 'data\processed_data\META\4_2023-04-12.md'
Converted 'data\edgar_documents\META\4_2023-04-20' --> 'data\processed_data\META\4_2023-04-20.md'
Converted 'data\edgar_documents\META\4_2023-04-27' --> 'data\processed_data\META\4_2023-04-27.md'
Error processing data\edgar_documents\META\4_2023-05-01: File format not allowed: data\edgar_documents\META\4_2023-05-01
Error processing data\edgar_documents\META\4_2023-05-02: File format not allowed: data\edgar_documents\META\4_2023-05-02


2025-11-14 17:16:38,101 - INFO - Going to convert document batch...
2025-11-14 17:16:38,102 - INFO - Processing document 4_2023-05-03
2025-11-14 17:16:38,120 - INFO - Finished converting document 4_2023-05-03 in 0.05 sec.
2025-11-14 17:16:38,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,164 - INFO - Going to convert document batch...
2025-11-14 17:16:38,165 - INFO - Processing document 4_2023-05-10
2025-11-14 17:16:38,183 - INFO - Finished converting document 4_2023-05-10 in 0.05 sec.
2025-11-14 17:16:38,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,234 - INFO - Going to convert document batch...
2025-11-14 17:16:38,234 - INFO - Processing document 4_2023-05-17
2025-11-14 17:16:38,267 - INFO - Finished converting document 4_2023-05-17 in 0.06 sec.
2025-11-14 17:16:38,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,321 - INFO - Going to convert document batch...
2025-11-14 17:16:38,322 - 

Converted 'data\edgar_documents\META\4_2023-05-03' --> 'data\processed_data\META\4_2023-05-03.md'
Converted 'data\edgar_documents\META\4_2023-05-10' --> 'data\processed_data\META\4_2023-05-10.md'
Converted 'data\edgar_documents\META\4_2023-05-17' --> 'data\processed_data\META\4_2023-05-17.md'


2025-11-14 17:16:38,701 - INFO - Finished converting document 4_2023-05-19 in 0.41 sec.
2025-11-14 17:16:38,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,750 - INFO - Going to convert document batch...
2025-11-14 17:16:38,751 - INFO - Processing document 4_2023-05-24
2025-11-14 17:16:38,769 - INFO - Finished converting document 4_2023-05-24 in 0.05 sec.
2025-11-14 17:16:38,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,811 - INFO - Going to convert document batch...
2025-11-14 17:16:38,812 - INFO - Processing document 4_2023-05-25
2025-11-14 17:16:38,830 - INFO - Finished converting document 4_2023-05-25 in 0.03 sec.
2025-11-14 17:16:38,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,870 - INFO - Going to convert document batch...
2025-11-14 17:16:38,871 - INFO - Processing document 4_2023-06-01
2025-11-14 17:16:38,887 - INFO - Finished converting document 4_2023-06-01 in 0.05 sec.


Converted 'data\edgar_documents\META\4_2023-05-19' --> 'data\processed_data\META\4_2023-05-19.md'
Converted 'data\edgar_documents\META\4_2023-05-24' --> 'data\processed_data\META\4_2023-05-24.md'
Converted 'data\edgar_documents\META\4_2023-05-25' --> 'data\processed_data\META\4_2023-05-25.md'


2025-11-14 17:16:38,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,930 - INFO - Going to convert document batch...
2025-11-14 17:16:38,931 - INFO - Processing document 4_2023-06-08
2025-11-14 17:16:38,951 - INFO - Finished converting document 4_2023-06-08 in 0.05 sec.
2025-11-14 17:16:38,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:38,997 - INFO - Going to convert document batch...
2025-11-14 17:16:38,997 - INFO - Processing document 4_2023-06-15
2025-11-14 17:16:39,016 - INFO - Finished converting document 4_2023-06-15 in 0.05 sec.
2025-11-14 17:16:39,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,076 - INFO - Going to convert document batch...
2025-11-14 17:16:39,077 - INFO - Processing document 4_2023-06-16
2025-11-14 17:16:39,098 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.


Converted 'data\edgar_documents\META\4_2023-06-01' --> 'data\processed_data\META\4_2023-06-01.md'
Converted 'data\edgar_documents\META\4_2023-06-08' --> 'data\processed_data\META\4_2023-06-08.md'
Converted 'data\edgar_documents\META\4_2023-06-15' --> 'data\processed_data\META\4_2023-06-15.md'


2025-11-14 17:16:39,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,142 - INFO - Going to convert document batch...
2025-11-14 17:16:39,143 - INFO - Processing document 4_2023-06-22
2025-11-14 17:16:39,163 - INFO - Finished converting document 4_2023-06-22 in 0.03 sec.
2025-11-14 17:16:39,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,210 - INFO - Going to convert document batch...
2025-11-14 17:16:39,211 - INFO - Processing document 4_2023-06-29
2025-11-14 17:16:39,229 - INFO - Finished converting document 4_2023-06-29 in 0.05 sec.
2025-11-14 17:16:39,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,270 - INFO - Going to convert document batch...
2025-11-14 17:16:39,271 - INFO - Processing document 4_2023-07-05
2025-11-14 17:16:39,288 - INFO - Finished converting document 4_2023-07-05 in 0.03 sec.
2025-11-14 17:16:39,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2023-06-16' --> 'data\processed_data\META\4_2023-06-16.md'
Converted 'data\edgar_documents\META\4_2023-06-22' --> 'data\processed_data\META\4_2023-06-22.md'
Converted 'data\edgar_documents\META\4_2023-06-29' --> 'data\processed_data\META\4_2023-06-29.md'
Converted 'data\edgar_documents\META\4_2023-07-05' --> 'data\processed_data\META\4_2023-07-05.md'


2025-11-14 17:16:39,329 - INFO - Going to convert document batch...
2025-11-14 17:16:39,330 - INFO - Processing document 4_2023-07-13
2025-11-14 17:16:39,348 - INFO - Finished converting document 4_2023-07-13 in 0.03 sec.
2025-11-14 17:16:39,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,394 - INFO - Going to convert document batch...
2025-11-14 17:16:39,394 - INFO - Processing document 4_2023-07-20
2025-11-14 17:16:39,412 - INFO - Finished converting document 4_2023-07-20 in 0.03 sec.
2025-11-14 17:16:39,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,465 - INFO - Going to convert document batch...
2025-11-14 17:16:39,465 - INFO - Processing document 4_2023-07-27
2025-11-14 17:16:39,483 - INFO - Finished converting document 4_2023-07-27 in 0.06 sec.
2025-11-14 17:16:39,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,518 - INFO - Going to convert document batch...
2025-11-14 17:16:39,519 - 

Converted 'data\edgar_documents\META\4_2023-07-13' --> 'data\processed_data\META\4_2023-07-13.md'
Converted 'data\edgar_documents\META\4_2023-07-20' --> 'data\processed_data\META\4_2023-07-20.md'
Converted 'data\edgar_documents\META\4_2023-07-27' --> 'data\processed_data\META\4_2023-07-27.md'
Converted 'data\edgar_documents\META\4_2023-08-03' --> 'data\processed_data\META\4_2023-08-03.md'


2025-11-14 17:16:39,584 - INFO - Going to convert document batch...
2025-11-14 17:16:39,585 - INFO - Processing document 4_2023-08-09
2025-11-14 17:16:39,637 - INFO - Finished converting document 4_2023-08-09 in 0.09 sec.
2025-11-14 17:16:39,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,694 - INFO - Going to convert document batch...
2025-11-14 17:16:39,695 - INFO - Processing document 4_2023-08-10
2025-11-14 17:16:39,713 - INFO - Finished converting document 4_2023-08-10 in 0.03 sec.
2025-11-14 17:16:39,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,771 - INFO - Going to convert document batch...
2025-11-14 17:16:39,771 - INFO - Processing document 4_2023-08-17
2025-11-14 17:16:39,791 - INFO - Finished converting document 4_2023-08-17 in 0.06 sec.
2025-11-14 17:16:39,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,831 - INFO - Going to convert document batch...
2025-11-14 17:16:39,832 - 

Converted 'data\edgar_documents\META\4_2023-08-09' --> 'data\processed_data\META\4_2023-08-09.md'
Converted 'data\edgar_documents\META\4_2023-08-10' --> 'data\processed_data\META\4_2023-08-10.md'
Converted 'data\edgar_documents\META\4_2023-08-17' --> 'data\processed_data\META\4_2023-08-17.md'


2025-11-14 17:16:39,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,895 - INFO - Going to convert document batch...
2025-11-14 17:16:39,896 - INFO - Processing document 4_2023-08-23
2025-11-14 17:16:39,917 - INFO - Finished converting document 4_2023-08-23 in 0.05 sec.
2025-11-14 17:16:39,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:39,964 - INFO - Going to convert document batch...
2025-11-14 17:16:39,965 - INFO - Processing document 4_2023-08-24
2025-11-14 17:16:39,983 - INFO - Finished converting document 4_2023-08-24 in 0.05 sec.
2025-11-14 17:16:40,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,046 - INFO - Going to convert document batch...
2025-11-14 17:16:40,047 - INFO - Processing document 4_2023-08-31
2025-11-14 17:16:40,068 - INFO - Finished converting document 4_2023-08-31 in 0.06 sec.


Converted 'data\edgar_documents\META\4_2023-08-18' --> 'data\processed_data\META\4_2023-08-18.md'
Converted 'data\edgar_documents\META\4_2023-08-23' --> 'data\processed_data\META\4_2023-08-23.md'
Converted 'data\edgar_documents\META\4_2023-08-24' --> 'data\processed_data\META\4_2023-08-24.md'


2025-11-14 17:16:40,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,106 - INFO - Going to convert document batch...
2025-11-14 17:16:40,107 - INFO - Processing document 4_2023-09-07
2025-11-14 17:16:40,129 - INFO - Finished converting document 4_2023-09-07 in 0.05 sec.
2025-11-14 17:16:40,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,190 - INFO - Going to convert document batch...
2025-11-14 17:16:40,191 - INFO - Processing document 4_2023-09-14
2025-11-14 17:16:40,228 - INFO - Finished converting document 4_2023-09-14 in 0.08 sec.
2025-11-14 17:16:40,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2023-08-31' --> 'data\processed_data\META\4_2023-08-31.md'
Converted 'data\edgar_documents\META\4_2023-09-07' --> 'data\processed_data\META\4_2023-09-07.md'
Converted 'data\edgar_documents\META\4_2023-09-14' --> 'data\processed_data\META\4_2023-09-14.md'


2025-11-14 17:16:40,267 - INFO - Going to convert document batch...
2025-11-14 17:16:40,268 - INFO - Processing document 4_2023-09-21
2025-11-14 17:16:40,286 - INFO - Finished converting document 4_2023-09-21 in 0.03 sec.
2025-11-14 17:16:40,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,324 - INFO - Going to convert document batch...
2025-11-14 17:16:40,325 - INFO - Processing document 4_2023-09-28
2025-11-14 17:16:40,342 - INFO - Finished converting document 4_2023-09-28 in 0.05 sec.
2025-11-14 17:16:40,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,380 - INFO - Going to convert document batch...
2025-11-14 17:16:40,380 - INFO - Processing document 4_2023-10-05
2025-11-14 17:16:40,397 - INFO - Finished converting document 4_2023-10-05 in 0.03 sec.
2025-11-14 17:16:40,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,435 - INFO - Going to convert document batch...
2025-11-14 17:16:40,436 - 

Converted 'data\edgar_documents\META\4_2023-09-21' --> 'data\processed_data\META\4_2023-09-21.md'
Converted 'data\edgar_documents\META\4_2023-09-28' --> 'data\processed_data\META\4_2023-09-28.md'
Converted 'data\edgar_documents\META\4_2023-10-05' --> 'data\processed_data\META\4_2023-10-05.md'
Converted 'data\edgar_documents\META\4_2023-10-12' --> 'data\processed_data\META\4_2023-10-12.md'


2025-11-14 17:16:40,494 - INFO - Going to convert document batch...
2025-11-14 17:16:40,494 - INFO - Processing document 4_2023-10-19
2025-11-14 17:16:40,511 - INFO - Finished converting document 4_2023-10-19 in 0.05 sec.
2025-11-14 17:16:40,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,551 - INFO - Going to convert document batch...
2025-11-14 17:16:40,551 - INFO - Processing document 4_2023-10-26
2025-11-14 17:16:40,578 - INFO - Finished converting document 4_2023-10-26 in 0.05 sec.
2025-11-14 17:16:40,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,635 - INFO - Going to convert document batch...
2025-11-14 17:16:40,636 - INFO - Processing document 4_2023-11-02
2025-11-14 17:16:40,654 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:16:40,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,736 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2023-10-19' --> 'data\processed_data\META\4_2023-10-19.md'
Converted 'data\edgar_documents\META\4_2023-10-26' --> 'data\processed_data\META\4_2023-10-26.md'
Converted 'data\edgar_documents\META\4_2023-11-02' --> 'data\processed_data\META\4_2023-11-02.md'


2025-11-14 17:16:40,738 - INFO - Processing document 4_2023-11-03
2025-11-14 17:16:40,820 - INFO - Finished converting document 4_2023-11-03 in 0.14 sec.
2025-11-14 17:16:40,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:40,909 - INFO - Going to convert document batch...
2025-11-14 17:16:40,910 - INFO - Processing document 4_2023-11-07
2025-11-14 17:16:40,961 - INFO - Finished converting document 4_2023-11-07 in 0.08 sec.
2025-11-14 17:16:41,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,062 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2023-11-03' --> 'data\processed_data\META\4_2023-11-03.md'
Converted 'data\edgar_documents\META\4_2023-11-07' --> 'data\processed_data\META\4_2023-11-07.md'


2025-11-14 17:16:41,063 - INFO - Processing document 4_2023-11-09
2025-11-14 17:16:41,129 - INFO - Finished converting document 4_2023-11-09 in 0.12 sec.
2025-11-14 17:16:41,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,222 - INFO - Going to convert document batch...
2025-11-14 17:16:41,223 - INFO - Processing document 4_2023-11-13
2025-11-14 17:16:41,299 - INFO - Finished converting document 4_2023-11-13 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2023-11-09' --> 'data\processed_data\META\4_2023-11-09.md'
Converted 'data\edgar_documents\META\4_2023-11-13' --> 'data\processed_data\META\4_2023-11-13.md'


2025-11-14 17:16:41,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,422 - INFO - Going to convert document batch...
2025-11-14 17:16:41,424 - INFO - Processing document 4_2023-11-15
2025-11-14 17:16:41,511 - INFO - Finished converting document 4_2023-11-15 in 0.16 sec.
2025-11-14 17:16:41,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,614 - INFO - Going to convert document batch...
2025-11-14 17:16:41,614 - INFO - Processing document 4_2023-11-17
2025-11-14 17:16:41,633 - INFO - Finished converting document 4_2023-11-17 in 0.06 sec.
2025-11-14 17:16:41,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,689 - INFO - Going to convert document batch...
2025-11-14 17:16:41,690 - INFO - Processing document 4_2023-11-20
2025-11-14 17:16:41,750 - INFO - Finished converting document 4_2023-11-20 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2023-11-15' --> 'data\processed_data\META\4_2023-11-15.md'
Converted 'data\edgar_documents\META\4_2023-11-17' --> 'data\processed_data\META\4_2023-11-17.md'


2025-11-14 17:16:41,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,835 - INFO - Going to convert document batch...
2025-11-14 17:16:41,836 - INFO - Processing document 4_2023-11-22
2025-11-14 17:16:41,888 - INFO - Finished converting document 4_2023-11-22 in 0.09 sec.
2025-11-14 17:16:41,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:41,989 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2023-11-20' --> 'data\processed_data\META\4_2023-11-20.md'
Converted 'data\edgar_documents\META\4_2023-11-22' --> 'data\processed_data\META\4_2023-11-22.md'


2025-11-14 17:16:41,989 - INFO - Processing document 4_2023-11-27
2025-11-14 17:16:42,263 - INFO - Finished converting document 4_2023-11-27 in 0.33 sec.
2025-11-14 17:16:42,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:42,351 - INFO - Going to convert document batch...
2025-11-14 17:16:42,353 - INFO - Processing document 4_2023-11-29
2025-11-14 17:16:42,419 - INFO - Finished converting document 4_2023-11-29 in 0.11 sec.
2025-11-14 17:16:42,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2023-11-27' --> 'data\processed_data\META\4_2023-11-27.md'
Converted 'data\edgar_documents\META\4_2023-11-29' --> 'data\processed_data\META\4_2023-11-29.md'


2025-11-14 17:16:42,508 - INFO - Going to convert document batch...
2025-11-14 17:16:42,509 - INFO - Processing document 4_2023-11-30
2025-11-14 17:16:42,525 - INFO - Finished converting document 4_2023-11-30 in 0.05 sec.
2025-11-14 17:16:42,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:42,568 - INFO - Going to convert document batch...
2025-11-14 17:16:42,568 - INFO - Processing document 4_2023-12-01
2025-11-14 17:16:42,588 - INFO - Finished converting document 4_2023-12-01 in 0.05 sec.
2025-11-14 17:16:42,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:42,667 - INFO - Going to convert document batch...
2025-11-14 17:16:42,668 - INFO - Processing document 4_2023-12-04
2025-11-14 17:16:42,727 - INFO - Finished converting document 4_2023-12-04 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2023-11-30' --> 'data\processed_data\META\4_2023-11-30.md'
Converted 'data\edgar_documents\META\4_2023-12-01' --> 'data\processed_data\META\4_2023-12-01.md'


2025-11-14 17:16:42,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:42,810 - INFO - Going to convert document batch...
2025-11-14 17:16:42,811 - INFO - Processing document 4_2023-12-06
2025-11-14 17:16:42,874 - INFO - Finished converting document 4_2023-12-06 in 0.09 sec.
2025-11-14 17:16:42,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:42,940 - INFO - Going to convert document batch...
2025-11-14 17:16:42,940 - INFO - Processing document 4_2023-12-07
2025-11-14 17:16:42,958 - INFO - Finished converting document 4_2023-12-07 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2023-12-04' --> 'data\processed_data\META\4_2023-12-04.md'
Converted 'data\edgar_documents\META\4_2023-12-06' --> 'data\processed_data\META\4_2023-12-06.md'


2025-11-14 17:16:42,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,023 - INFO - Going to convert document batch...
2025-11-14 17:16:43,024 - INFO - Processing document 4_2023-12-11
2025-11-14 17:16:43,130 - INFO - Finished converting document 4_2023-12-11 in 0.16 sec.


Converted 'data\edgar_documents\META\4_2023-12-07' --> 'data\processed_data\META\4_2023-12-07.md'


2025-11-14 17:16:43,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,226 - INFO - Going to convert document batch...
2025-11-14 17:16:43,227 - INFO - Processing document 4_2023-12-13
2025-11-14 17:16:43,290 - INFO - Finished converting document 4_2023-12-13 in 0.09 sec.
2025-11-14 17:16:43,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,358 - INFO - Going to convert document batch...
2025-11-14 17:16:43,358 - INFO - Processing document 4_2023-12-14


Converted 'data\edgar_documents\META\4_2023-12-11' --> 'data\processed_data\META\4_2023-12-11.md'
Converted 'data\edgar_documents\META\4_2023-12-13' --> 'data\processed_data\META\4_2023-12-13.md'


2025-11-14 17:16:43,376 - INFO - Finished converting document 4_2023-12-14 in 0.03 sec.
2025-11-14 17:16:43,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,459 - INFO - Going to convert document batch...
2025-11-14 17:16:43,460 - INFO - Processing document 4_2023-12-18
2025-11-14 17:16:43,531 - INFO - Finished converting document 4_2023-12-18 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2023-12-14' --> 'data\processed_data\META\4_2023-12-14.md'
Converted 'data\edgar_documents\META\4_2023-12-18' --> 'data\processed_data\META\4_2023-12-18.md'


2025-11-14 17:16:43,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,624 - INFO - Going to convert document batch...
2025-11-14 17:16:43,625 - INFO - Processing document 4_2023-12-20
2025-11-14 17:16:43,696 - INFO - Finished converting document 4_2023-12-20 in 0.11 sec.
2025-11-14 17:16:43,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,766 - INFO - Going to convert document batch...
2025-11-14 17:16:43,767 - INFO - Processing document 4_2023-12-21
2025-11-14 17:16:43,786 - INFO - Finished converting document 4_2023-12-21 in 0.03 sec.
2025-11-14 17:16:43,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:43,865 - INFO - Going to convert document batch...
2025-11-14 17:16:43,866 - INFO - Processing document 4_2023-12-26
2025-11-14 17:16:43,931 - INFO - Finished converting document 4_2023-12-26 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2023-12-20' --> 'data\processed_data\META\4_2023-12-20.md'
Converted 'data\edgar_documents\META\4_2023-12-21' --> 'data\processed_data\META\4_2023-12-21.md'


2025-11-14 17:16:43,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,015 - INFO - Going to convert document batch...
2025-11-14 17:16:44,016 - INFO - Processing document 4_2023-12-27
2025-11-14 17:16:44,072 - INFO - Finished converting document 4_2023-12-27 in 0.08 sec.
2025-11-14 17:16:44,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,133 - INFO - Going to convert document batch...
2025-11-14 17:16:44,134 - INFO - Processing document 4_2023-12-28
2025-11-14 17:16:44,151 - INFO - Finished converting document 4_2023-12-28 in 0.05 sec.


Converted 'data\edgar_documents\META\4_2023-12-26' --> 'data\processed_data\META\4_2023-12-26.md'
Converted 'data\edgar_documents\META\4_2023-12-27' --> 'data\processed_data\META\4_2023-12-27.md'
Converted 'data\edgar_documents\META\4_2023-12-28' --> 'data\processed_data\META\4_2023-12-28.md'


2025-11-14 17:16:44,198 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,234 - INFO - Going to convert document batch...
2025-11-14 17:16:44,235 - INFO - Processing document 4_2024-01-02
2025-11-14 17:16:44,335 - INFO - Finished converting document 4_2024-01-02 in 0.16 sec.
2025-11-14 17:16:44,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,415 - INFO - Going to convert document batch...
2025-11-14 17:16:44,415 - INFO - Processing document 4_2024-01-03
2025-11-14 17:16:44,433 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 17:16:44,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,484 - INFO - Going to convert document batch...
2025-11-14 17:16:44,485 - INFO - Processing document 4_2024-01-08
2025-11-14 17:16:44,537 - INFO - Finished converting document 4_2024-01-08 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-01-02' --> 'data\processed_data\META\4_2024-01-02.md'
Converted 'data\edgar_documents\META\4_2024-01-03' --> 'data\processed_data\META\4_2024-01-03.md'
Converted 'data\edgar_documents\META\4_2024-01-08' --> 'data\processed_data\META\4_2024-01-08.md'


2025-11-14 17:16:44,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,609 - INFO - Going to convert document batch...
2025-11-14 17:16:44,609 - INFO - Processing document 4_2024-01-10
2025-11-14 17:16:44,665 - INFO - Finished converting document 4_2024-01-10 in 0.08 sec.
2025-11-14 17:16:44,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,744 - INFO - Going to convert document batch...
2025-11-14 17:16:44,745 - INFO - Processing document 4_2024-01-11
2025-11-14 17:16:44,763 - INFO - Finished converting document 4_2024-01-11 in 0.06 sec.
2025-11-14 17:16:44,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:44,835 - INFO - Going to convert document batch...
2025-11-14 17:16:44,836 - INFO - Processing document 4_2024-01-16


Converted 'data\edgar_documents\META\4_2024-01-10' --> 'data\processed_data\META\4_2024-01-10.md'
Converted 'data\edgar_documents\META\4_2024-01-11' --> 'data\processed_data\META\4_2024-01-11.md'


2025-11-14 17:16:44,901 - INFO - Finished converting document 4_2024-01-16 in 0.12 sec.
2025-11-14 17:16:44,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-01-16' --> 'data\processed_data\META\4_2024-01-16.md'


2025-11-14 17:16:45,229 - INFO - Going to convert document batch...
2025-11-14 17:16:45,230 - INFO - Processing document 4_2024-01-17
2025-11-14 17:16:45,311 - INFO - Finished converting document 4_2024-01-17 in 0.34 sec.
2025-11-14 17:16:45,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:45,396 - INFO - Going to convert document batch...
2025-11-14 17:16:45,397 - INFO - Processing document 4_2024-01-18
2025-11-14 17:16:45,413 - INFO - Finished converting document 4_2024-01-18 in 0.03 sec.
2025-11-14 17:16:45,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:45,468 - INFO - Going to convert document batch...
2025-11-14 17:16:45,469 - INFO - Processing document 4_2024-01-22
2025-11-14 17:16:45,534 - INFO - Finished converting document 4_2024-01-22 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2024-01-17' --> 'data\processed_data\META\4_2024-01-17.md'
Converted 'data\edgar_documents\META\4_2024-01-18' --> 'data\processed_data\META\4_2024-01-18.md'


2025-11-14 17:16:45,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:45,629 - INFO - Going to convert document batch...
2025-11-14 17:16:45,629 - INFO - Processing document 4_2024-01-24
2025-11-14 17:16:45,705 - INFO - Finished converting document 4_2024-01-24 in 0.11 sec.
2025-11-14 17:16:45,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-01-22' --> 'data\processed_data\META\4_2024-01-22.md'
Converted 'data\edgar_documents\META\4_2024-01-24' --> 'data\processed_data\META\4_2024-01-24.md'


2025-11-14 17:16:45,780 - INFO - Going to convert document batch...
2025-11-14 17:16:45,781 - INFO - Processing document 4_2024-01-25
2025-11-14 17:16:45,798 - INFO - Finished converting document 4_2024-01-25 in 0.03 sec.
2025-11-14 17:16:45,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:45,840 - INFO - Going to convert document batch...
2025-11-14 17:16:45,840 - INFO - Processing document 4_2024-01-26
2025-11-14 17:16:45,863 - INFO - Finished converting document 4_2024-01-26 in 0.05 sec.
2025-11-14 17:16:45,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:45,919 - INFO - Going to convert document batch...
2025-11-14 17:16:45,920 - INFO - Processing document 4_2024-01-29
2025-11-14 17:16:45,984 - INFO - Finished converting document 4_2024-01-29 in 0.11 sec.


Converted 'data\edgar_documents\META\4_2024-01-25' --> 'data\processed_data\META\4_2024-01-25.md'
Converted 'data\edgar_documents\META\4_2024-01-26' --> 'data\processed_data\META\4_2024-01-26.md'


2025-11-14 17:16:46,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,081 - INFO - Going to convert document batch...
2025-11-14 17:16:46,082 - INFO - Processing document 4_2024-01-31
2025-11-14 17:16:46,198 - INFO - Finished converting document 4_2024-01-31 in 0.17 sec.


Converted 'data\edgar_documents\META\4_2024-01-29' --> 'data\processed_data\META\4_2024-01-29.md'


2025-11-14 17:16:46,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,286 - INFO - Going to convert document batch...
2025-11-14 17:16:46,286 - INFO - Processing document 4_2024-02-01
2025-11-14 17:16:46,304 - INFO - Finished converting document 4_2024-02-01 in 0.03 sec.
2025-11-14 17:16:46,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,367 - INFO - Going to convert document batch...
2025-11-14 17:16:46,368 - INFO - Processing document 4_2024-02-05
2025-11-14 17:16:46,449 - INFO - Finished converting document 4_2024-02-05 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-01-31' --> 'data\processed_data\META\4_2024-01-31.md'
Converted 'data\edgar_documents\META\4_2024-02-01' --> 'data\processed_data\META\4_2024-02-01.md'


2025-11-14 17:16:46,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,582 - INFO - Going to convert document batch...
2025-11-14 17:16:46,582 - INFO - Processing document 4_2024-02-07
2025-11-14 17:16:46,661 - INFO - Finished converting document 4_2024-02-07 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-02-05' --> 'data\processed_data\META\4_2024-02-05.md'
Converted 'data\edgar_documents\META\4_2024-02-07' --> 'data\processed_data\META\4_2024-02-07.md'


2025-11-14 17:16:46,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,786 - INFO - Going to convert document batch...
2025-11-14 17:16:46,787 - INFO - Processing document 4_2024-02-12
2025-11-14 17:16:46,871 - INFO - Finished converting document 4_2024-02-12 in 0.16 sec.
2025-11-14 17:16:46,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:46,991 - INFO - Going to convert document batch...
2025-11-14 17:16:46,992 - INFO - Processing document 4_2024-02-14
2025-11-14 17:16:47,051 - INFO - Finished converting document 4_2024-02-14 in 0.12 sec.
2025-11-14 17:16:47,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-02-12' --> 'data\processed_data\META\4_2024-02-12.md'
Converted 'data\edgar_documents\META\4_2024-02-14' --> 'data\processed_data\META\4_2024-02-14.md'


2025-11-14 17:16:47,124 - INFO - Going to convert document batch...
2025-11-14 17:16:47,125 - INFO - Processing document 4_2024-02-20
2025-11-14 17:16:47,145 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 17:16:47,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:47,218 - INFO - Going to convert document batch...
2025-11-14 17:16:47,219 - INFO - Processing document 4_2024-02-21
2025-11-14 17:16:47,309 - INFO - Finished converting document 4_2024-02-21 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2024-02-20' --> 'data\processed_data\META\4_2024-02-20.md'


2025-11-14 17:16:47,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:47,398 - INFO - Going to convert document batch...
2025-11-14 17:16:47,399 - INFO - Processing document 4_2024-02-22
2025-11-14 17:16:47,416 - INFO - Finished converting document 4_2024-02-22 in 0.05 sec.
2025-11-14 17:16:47,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:47,488 - INFO - Going to convert document batch...
2025-11-14 17:16:47,489 - INFO - Processing document 4_2024-02-26
2025-11-14 17:16:47,544 - INFO - Finished converting document 4_2024-02-26 in 0.11 sec.


Converted 'data\edgar_documents\META\4_2024-02-21' --> 'data\processed_data\META\4_2024-02-21.md'
Converted 'data\edgar_documents\META\4_2024-02-22' --> 'data\processed_data\META\4_2024-02-22.md'


2025-11-14 17:16:47,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:47,612 - INFO - Going to convert document batch...
2025-11-14 17:16:47,612 - INFO - Processing document 4_2024-02-27
2025-11-14 17:16:47,636 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 17:16:47,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-02-26' --> 'data\processed_data\META\4_2024-02-26.md'
Converted 'data\edgar_documents\META\4_2024-02-27' --> 'data\processed_data\META\4_2024-02-27.md'


2025-11-14 17:16:47,908 - INFO - Going to convert document batch...
2025-11-14 17:16:47,909 - INFO - Processing document 4_2024-02-28
2025-11-14 17:16:47,995 - INFO - Finished converting document 4_2024-02-28 in 0.34 sec.
2025-11-14 17:16:48,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,102 - INFO - Going to convert document batch...
2025-11-14 17:16:48,104 - INFO - Processing document 4_2024-02-29
2025-11-14 17:16:48,120 - INFO - Finished converting document 4_2024-02-29 in 0.06 sec.
2025-11-14 17:16:48,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,170 - INFO - Going to convert document batch...
2025-11-14 17:16:48,171 - INFO - Processing document 4_2024-03-04
2025-11-14 17:16:48,220 - INFO - Finished converting document 4_2024-03-04 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-02-28' --> 'data\processed_data\META\4_2024-02-28.md'
Converted 'data\edgar_documents\META\4_2024-02-29' --> 'data\processed_data\META\4_2024-02-29.md'
Converted 'data\edgar_documents\META\4_2024-03-04' --> 'data\processed_data\META\4_2024-03-04.md'


2025-11-14 17:16:48,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,284 - INFO - Going to convert document batch...
2025-11-14 17:16:48,285 - INFO - Processing document 4_2024-03-05
2025-11-14 17:16:48,308 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:16:48,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,376 - INFO - Going to convert document batch...
2025-11-14 17:16:48,377 - INFO - Processing document 4_2024-03-06
2025-11-14 17:16:48,459 - INFO - Finished converting document 4_2024-03-06 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-03-05' --> 'data\processed_data\META\4_2024-03-05.md'
Converted 'data\edgar_documents\META\4_2024-03-06' --> 'data\processed_data\META\4_2024-03-06.md'


2025-11-14 17:16:48,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,556 - INFO - Going to convert document batch...
2025-11-14 17:16:48,557 - INFO - Processing document 4_2024-03-07
2025-11-14 17:16:48,575 - INFO - Finished converting document 4_2024-03-07 in 0.06 sec.
2025-11-14 17:16:48,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,649 - INFO - Going to convert document batch...
2025-11-14 17:16:48,650 - INFO - Processing document 4_2024-03-11
2025-11-14 17:16:48,727 - INFO - Finished converting document 4_2024-03-11 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-03-07' --> 'data\processed_data\META\4_2024-03-07.md'


2025-11-14 17:16:48,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,810 - INFO - Going to convert document batch...
2025-11-14 17:16:48,812 - INFO - Processing document 4_2024-03-12
2025-11-14 17:16:48,834 - INFO - Finished converting document 4_2024-03-12 in 0.05 sec.
2025-11-14 17:16:48,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:48,900 - INFO - Going to convert document batch...
2025-11-14 17:16:48,901 - INFO - Processing document 4_2024-03-13
2025-11-14 17:16:48,986 - INFO - Finished converting document 4_2024-03-13 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-03-11' --> 'data\processed_data\META\4_2024-03-11.md'
Converted 'data\edgar_documents\META\4_2024-03-12' --> 'data\processed_data\META\4_2024-03-12.md'


2025-11-14 17:16:49,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,089 - INFO - Going to convert document batch...
2025-11-14 17:16:49,089 - INFO - Processing document 4_2024-03-14
2025-11-14 17:16:49,108 - INFO - Finished converting document 4_2024-03-14 in 0.06 sec.
2025-11-14 17:16:49,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,172 - INFO - Going to convert document batch...
2025-11-14 17:16:49,173 - INFO - Processing document 4_2024-03-18


Converted 'data\edgar_documents\META\4_2024-03-13' --> 'data\processed_data\META\4_2024-03-13.md'
Converted 'data\edgar_documents\META\4_2024-03-14' --> 'data\processed_data\META\4_2024-03-14.md'


2025-11-14 17:16:49,260 - INFO - Finished converting document 4_2024-03-18 in 0.14 sec.
2025-11-14 17:16:49,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,352 - INFO - Going to convert document batch...
2025-11-14 17:16:49,353 - INFO - Processing document 4_2024-03-19
2025-11-14 17:16:49,394 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 17:16:49,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,473 - INFO - Going to convert document batch...
2025-11-14 17:16:49,474 - INFO - Processing document 4_2024-03-20
2025-11-14 17:16:49,529 - INFO - Finished converting document 4_2024-03-20 in 0.11 sec.


Converted 'data\edgar_documents\META\4_2024-03-18' --> 'data\processed_data\META\4_2024-03-18.md'
Converted 'data\edgar_documents\META\4_2024-03-19' --> 'data\processed_data\META\4_2024-03-19.md'


2025-11-14 17:16:49,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,599 - INFO - Going to convert document batch...
2025-11-14 17:16:49,600 - INFO - Processing document 4_2024-03-21
2025-11-14 17:16:49,620 - INFO - Finished converting document 4_2024-03-21 in 0.05 sec.
2025-11-14 17:16:49,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,662 - INFO - Going to convert document batch...
2025-11-14 17:16:49,662 - INFO - Processing document 4_2024-03-22
2025-11-14 17:16:49,688 - INFO - Finished converting document 4_2024-03-22 in 0.05 sec.
2025-11-14 17:16:49,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,762 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-03-20' --> 'data\processed_data\META\4_2024-03-20.md'
Converted 'data\edgar_documents\META\4_2024-03-21' --> 'data\processed_data\META\4_2024-03-21.md'
Converted 'data\edgar_documents\META\4_2024-03-22' --> 'data\processed_data\META\4_2024-03-22.md'


2025-11-14 17:16:49,763 - INFO - Processing document 4_2024-03-25
2025-11-14 17:16:49,842 - INFO - Finished converting document 4_2024-03-25 in 0.12 sec.
2025-11-14 17:16:49,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,921 - INFO - Going to convert document batch...
2025-11-14 17:16:49,921 - INFO - Processing document 4_2024-03-26
2025-11-14 17:16:49,943 - INFO - Finished converting document 4_2024-03-26 in 0.05 sec.
2025-11-14 17:16:49,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:49,999 - INFO - Going to convert document batch...
2025-11-14 17:16:50,000 - INFO - Processing document 4_2024-03-27
2025-11-14 17:16:50,052 - INFO - Finished converting document 4_2024-03-27 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-03-25' --> 'data\processed_data\META\4_2024-03-25.md'
Converted 'data\edgar_documents\META\4_2024-03-26' --> 'data\processed_data\META\4_2024-03-26.md'
Converted 'data\edgar_documents\META\4_2024-03-27' --> 'data\processed_data\META\4_2024-03-27.md'


2025-11-14 17:16:50,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,146 - INFO - Going to convert document batch...
2025-11-14 17:16:50,146 - INFO - Processing document 4_2024-04-01
2025-11-14 17:16:50,190 - INFO - Finished converting document 4_2024-04-01 in 0.09 sec.
2025-11-14 17:16:50,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,278 - INFO - Going to convert document batch...
2025-11-14 17:16:50,278 - INFO - Processing document 4_2024-04-03
2025-11-14 17:16:50,299 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 17:16:50,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,341 - INFO - Going to convert document batch...
2025-11-14 17:16:50,341 - INFO - Processing document 4_2024-04-09
2025-11-14 17:16:50,364 - INFO - Finished converting document 4_2024-04-09 in 0.05 sec.
2025-11-14 17:16:50,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2024-04-01' --> 'data\processed_data\META\4_2024-04-01.md'
Converted 'data\edgar_documents\META\4_2024-04-03' --> 'data\processed_data\META\4_2024-04-03.md'
Converted 'data\edgar_documents\META\4_2024-04-09' --> 'data\processed_data\META\4_2024-04-09.md'


2025-11-14 17:16:50,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,463 - INFO - Going to convert document batch...
2025-11-14 17:16:50,464 - INFO - Processing document 4_2024-04-16
2025-11-14 17:16:50,489 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 17:16:50,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,723 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-04-11' --> 'data\processed_data\META\4_2024-04-11.md'
Converted 'data\edgar_documents\META\4_2024-04-16' --> 'data\processed_data\META\4_2024-04-16.md'


2025-11-14 17:16:50,725 - INFO - Processing document 4_2024-04-18
2025-11-14 17:16:50,743 - INFO - Finished converting document 4_2024-04-18 in 0.22 sec.
2025-11-14 17:16:50,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,787 - INFO - Going to convert document batch...
2025-11-14 17:16:50,788 - INFO - Processing document 4_2024-04-23
2025-11-14 17:16:50,809 - INFO - Finished converting document 4_2024-04-23 in 0.05 sec.
2025-11-14 17:16:50,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,849 - INFO - Going to convert document batch...
2025-11-14 17:16:50,850 - INFO - Processing document 4_2024-04-25
2025-11-14 17:16:50,867 - INFO - Finished converting document 4_2024-04-25 in 0.03 sec.
2025-11-14 17:16:50,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,906 - INFO - Going to convert document batch...
2025-11-14 17:16:50,907 - INFO - Processing document 4_2024-04-30
2025-11-14 17:16:50,926 - IN

Converted 'data\edgar_documents\META\4_2024-04-18' --> 'data\processed_data\META\4_2024-04-18.md'
Converted 'data\edgar_documents\META\4_2024-04-23' --> 'data\processed_data\META\4_2024-04-23.md'
Converted 'data\edgar_documents\META\4_2024-04-25' --> 'data\processed_data\META\4_2024-04-25.md'


2025-11-14 17:16:50,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:50,991 - INFO - Going to convert document batch...
2025-11-14 17:16:50,993 - INFO - Processing document 4_2024-05-02
2025-11-14 17:16:51,018 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 17:16:51,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,061 - INFO - Going to convert document batch...
2025-11-14 17:16:51,062 - INFO - Processing document 4_2024-05-07
2025-11-14 17:16:51,083 - INFO - Finished converting document 4_2024-05-07 in 0.03 sec.
2025-11-14 17:16:51,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,124 - INFO - Going to convert document batch...
2025-11-14 17:16:51,125 - INFO - Processing document 4_2024-05-09
2025-11-14 17:16:51,143 - INFO - Finished converting document 4_2024-05-09 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2024-04-30' --> 'data\processed_data\META\4_2024-04-30.md'
Converted 'data\edgar_documents\META\4_2024-05-02' --> 'data\processed_data\META\4_2024-05-02.md'
Converted 'data\edgar_documents\META\4_2024-05-07' --> 'data\processed_data\META\4_2024-05-07.md'


2025-11-14 17:16:51,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,184 - INFO - Going to convert document batch...
2025-11-14 17:16:51,185 - INFO - Processing document 4_2024-05-17
2025-11-14 17:16:51,211 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 17:16:51,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,256 - INFO - Going to convert document batch...
2025-11-14 17:16:51,257 - INFO - Processing document 4_2024-05-23
2025-11-14 17:16:51,275 - INFO - Finished converting document 4_2024-05-23 in 0.03 sec.
2025-11-14 17:16:51,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,314 - INFO - Going to convert document batch...
2025-11-14 17:16:51,314 - INFO - Processing document 4_2024-05-28
2025-11-14 17:16:51,335 - INFO - Finished converting document 4_2024-05-28 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2024-05-09' --> 'data\processed_data\META\4_2024-05-09.md'
Converted 'data\edgar_documents\META\4_2024-05-17' --> 'data\processed_data\META\4_2024-05-17.md'
Converted 'data\edgar_documents\META\4_2024-05-23' --> 'data\processed_data\META\4_2024-05-23.md'


2025-11-14 17:16:51,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,422 - INFO - Going to convert document batch...
2025-11-14 17:16:51,423 - INFO - Processing document 4_2024-05-30
2025-11-14 17:16:51,441 - INFO - Finished converting document 4_2024-05-30 in 0.05 sec.
2025-11-14 17:16:51,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,491 - INFO - Going to convert document batch...
2025-11-14 17:16:51,492 - INFO - Processing document 4_2024-05-31
2025-11-14 17:16:51,532 - INFO - Finished converting document 4_2024-05-31 in 0.08 sec.
2025-11-14 17:16:51,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-05-28' --> 'data\processed_data\META\4_2024-05-28.md'
Converted 'data\edgar_documents\META\4_2024-05-30' --> 'data\processed_data\META\4_2024-05-30.md'
Converted 'data\edgar_documents\META\4_2024-05-31' --> 'data\processed_data\META\4_2024-05-31.md'


2025-11-14 17:16:51,588 - INFO - Going to convert document batch...
2025-11-14 17:16:51,589 - INFO - Processing document 4_2024-06-03
2025-11-14 17:16:51,609 - INFO - Finished converting document 4_2024-06-03 in 0.05 sec.
2025-11-14 17:16:51,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,651 - INFO - Going to convert document batch...
2025-11-14 17:16:51,652 - INFO - Processing document 4_2024-06-06
2025-11-14 17:16:51,674 - INFO - Finished converting document 4_2024-06-06 in 0.05 sec.
2025-11-14 17:16:51,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,717 - INFO - Going to convert document batch...
2025-11-14 17:16:51,717 - INFO - Processing document 4_2024-06-10
2025-11-14 17:16:51,757 - INFO - Finished converting document 4_2024-06-10 in 0.06 sec.
2025-11-14 17:16:51,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,828 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-06-03' --> 'data\processed_data\META\4_2024-06-03.md'
Converted 'data\edgar_documents\META\4_2024-06-06' --> 'data\processed_data\META\4_2024-06-06.md'
Converted 'data\edgar_documents\META\4_2024-06-10' --> 'data\processed_data\META\4_2024-06-10.md'


2025-11-14 17:16:51,829 - INFO - Processing document 4_2024-06-12
2025-11-14 17:16:51,891 - INFO - Finished converting document 4_2024-06-12 in 0.09 sec.
2025-11-14 17:16:51,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:51,959 - INFO - Going to convert document batch...
2025-11-14 17:16:51,960 - INFO - Processing document 4_2024-06-13
2025-11-14 17:16:51,977 - INFO - Finished converting document 4_2024-06-13 in 0.03 sec.
2025-11-14 17:16:52,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,029 - INFO - Going to convert document batch...
2025-11-14 17:16:52,030 - INFO - Processing document 4_2024-06-17
2025-11-14 17:16:52,081 - INFO - Finished converting document 4_2024-06-17 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-06-12' --> 'data\processed_data\META\4_2024-06-12.md'
Converted 'data\edgar_documents\META\4_2024-06-13' --> 'data\processed_data\META\4_2024-06-13.md'


2025-11-14 17:16:52,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,155 - INFO - Going to convert document batch...
2025-11-14 17:16:52,156 - INFO - Processing document 4_2024-06-20
2025-11-14 17:16:52,209 - INFO - Finished converting document 4_2024-06-20 in 0.08 sec.
2025-11-14 17:16:52,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,299 - INFO - Going to convert document batch...
2025-11-14 17:16:52,300 - INFO - Processing document 4_2024-06-24
2025-11-14 17:16:52,334 - INFO - Finished converting document 4_2024-06-24 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-06-17' --> 'data\processed_data\META\4_2024-06-17.md'
Converted 'data\edgar_documents\META\4_2024-06-20' --> 'data\processed_data\META\4_2024-06-20.md'


2025-11-14 17:16:52,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,401 - INFO - Going to convert document batch...
2025-11-14 17:16:52,401 - INFO - Processing document 4_2024-06-26
2025-11-14 17:16:52,482 - INFO - Finished converting document 4_2024-06-26 in 0.12 sec.
2025-11-14 17:16:52,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-06-24' --> 'data\processed_data\META\4_2024-06-24.md'
Converted 'data\edgar_documents\META\4_2024-06-26' --> 'data\processed_data\META\4_2024-06-26.md'


2025-11-14 17:16:52,550 - INFO - Going to convert document batch...
2025-11-14 17:16:52,551 - INFO - Processing document 4_2024-06-27
2025-11-14 17:16:52,569 - INFO - Finished converting document 4_2024-06-27 in 0.03 sec.
2025-11-14 17:16:52,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,641 - INFO - Going to convert document batch...
2025-11-14 17:16:52,642 - INFO - Processing document 4_2024-07-01
2025-11-14 17:16:52,739 - INFO - Finished converting document 4_2024-07-01 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2024-06-27' --> 'data\processed_data\META\4_2024-06-27.md'


2025-11-14 17:16:52,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,856 - INFO - Going to convert document batch...
2025-11-14 17:16:52,857 - INFO - Processing document 4_2024-07-03
2025-11-14 17:16:52,913 - INFO - Finished converting document 4_2024-07-03 in 0.08 sec.
2025-11-14 17:16:52,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:52,997 - INFO - Going to convert document batch...
2025-11-14 17:16:52,997 - INFO - Processing document 4_2024-07-08


Converted 'data\edgar_documents\META\4_2024-07-01' --> 'data\processed_data\META\4_2024-07-01.md'
Converted 'data\edgar_documents\META\4_2024-07-03' --> 'data\processed_data\META\4_2024-07-03.md'


2025-11-14 17:16:53,071 - INFO - Finished converting document 4_2024-07-08 in 0.11 sec.
2025-11-14 17:16:53,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:53,152 - INFO - Going to convert document batch...
2025-11-14 17:16:53,154 - INFO - Processing document 4_2024-07-09
2025-11-14 17:16:53,176 - INFO - Finished converting document 4_2024-07-09 in 0.05 sec.
2025-11-14 17:16:53,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:53,234 - INFO - Going to convert document batch...
2025-11-14 17:16:53,235 - INFO - Processing document 4_2024-07-10
2025-11-14 17:16:53,298 - INFO - Finished converting document 4_2024-07-10 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2024-07-08' --> 'data\processed_data\META\4_2024-07-08.md'
Converted 'data\edgar_documents\META\4_2024-07-09' --> 'data\processed_data\META\4_2024-07-09.md'


2025-11-14 17:16:53,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:53,390 - INFO - Going to convert document batch...
2025-11-14 17:16:53,391 - INFO - Processing document 4_2024-07-15
2025-11-14 17:16:53,451 - INFO - Finished converting document 4_2024-07-15 in 0.09 sec.
2025-11-14 17:16:53,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-07-10' --> 'data\processed_data\META\4_2024-07-10.md'
Converted 'data\edgar_documents\META\4_2024-07-15' --> 'data\processed_data\META\4_2024-07-15.md'


2025-11-14 17:16:53,560 - INFO - Going to convert document batch...
2025-11-14 17:16:53,561 - INFO - Processing document 4_2024-07-17
2025-11-14 17:16:53,804 - INFO - Finished converting document 4_2024-07-17 in 0.27 sec.
2025-11-14 17:16:53,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:53,878 - INFO - Going to convert document batch...
2025-11-14 17:16:53,879 - INFO - Processing document 4_2024-07-22
2025-11-14 17:16:53,899 - INFO - Finished converting document 4_2024-07-22 in 0.05 sec.
2025-11-14 17:16:53,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:53,963 - INFO - Going to convert document batch...
2025-11-14 17:16:53,964 - INFO - Processing document 4_2024-07-25
2025-11-14 17:16:53,983 - INFO - Finished converting document 4_2024-07-25 in 0.06 sec.
2025-11-14 17:16:54,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,024 - INFO - Going to convert document batch...
2025-11-14 17:16:54,025 - 

Converted 'data\edgar_documents\META\4_2024-07-17' --> 'data\processed_data\META\4_2024-07-17.md'
Converted 'data\edgar_documents\META\4_2024-07-22' --> 'data\processed_data\META\4_2024-07-22.md'
Converted 'data\edgar_documents\META\4_2024-07-25' --> 'data\processed_data\META\4_2024-07-25.md'


2025-11-14 17:16:54,047 - INFO - Finished converting document 4_2024-07-29 in 0.05 sec.
2025-11-14 17:16:54,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,090 - INFO - Going to convert document batch...
2025-11-14 17:16:54,091 - INFO - Processing document 4_2024-08-01
2025-11-14 17:16:54,109 - INFO - Finished converting document 4_2024-08-01 in 0.05 sec.
2025-11-14 17:16:54,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,180 - INFO - Going to convert document batch...
2025-11-14 17:16:54,181 - INFO - Processing document 4_2024-08-05
2025-11-14 17:16:54,228 - INFO - Finished converting document 4_2024-08-05 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2024-07-29' --> 'data\processed_data\META\4_2024-07-29.md'
Converted 'data\edgar_documents\META\4_2024-08-01' --> 'data\processed_data\META\4_2024-08-01.md'


2025-11-14 17:16:54,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,297 - INFO - Going to convert document batch...
2025-11-14 17:16:54,298 - INFO - Processing document 4_2024-08-07
2025-11-14 17:16:54,362 - INFO - Finished converting document 4_2024-08-07 in 0.09 sec.
2025-11-14 17:16:54,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,456 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-08-05' --> 'data\processed_data\META\4_2024-08-05.md'
Converted 'data\edgar_documents\META\4_2024-08-07' --> 'data\processed_data\META\4_2024-08-07.md'


2025-11-14 17:16:54,457 - INFO - Processing document 4_2024-08-08
2025-11-14 17:16:54,477 - INFO - Finished converting document 4_2024-08-08 in 0.06 sec.
2025-11-14 17:16:54,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,536 - INFO - Going to convert document batch...
2025-11-14 17:16:54,537 - INFO - Processing document 4_2024-08-12
2025-11-14 17:16:54,608 - INFO - Finished converting document 4_2024-08-12 in 0.11 sec.
2025-11-14 17:16:54,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,700 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-08-08' --> 'data\processed_data\META\4_2024-08-08.md'
Converted 'data\edgar_documents\META\4_2024-08-12' --> 'data\processed_data\META\4_2024-08-12.md'


2025-11-14 17:16:54,701 - INFO - Processing document 4_2024-08-14
2025-11-14 17:16:54,798 - INFO - Finished converting document 4_2024-08-14 in 0.14 sec.
2025-11-14 17:16:54,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,877 - INFO - Going to convert document batch...
2025-11-14 17:16:54,878 - INFO - Processing document 4_2024-08-19
2025-11-14 17:16:54,898 - INFO - Finished converting document 4_2024-08-19 in 0.03 sec.
2025-11-14 17:16:54,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:54,982 - INFO - Going to convert document batch...
2025-11-14 17:16:54,983 - INFO - Processing document 4_2024-08-21
2025-11-14 17:16:55,054 - INFO - Finished converting document 4_2024-08-21 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-08-14' --> 'data\processed_data\META\4_2024-08-14.md'
Converted 'data\edgar_documents\META\4_2024-08-19' --> 'data\processed_data\META\4_2024-08-19.md'


2025-11-14 17:16:55,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,132 - INFO - Going to convert document batch...
2025-11-14 17:16:55,133 - INFO - Processing document 4_2024-08-22
2025-11-14 17:16:55,154 - INFO - Finished converting document 4_2024-08-22 in 0.05 sec.
2025-11-14 17:16:55,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,217 - INFO - Going to convert document batch...
2025-11-14 17:16:55,217 - INFO - Processing document 4_2024-08-26
2025-11-14 17:16:55,296 - INFO - Finished converting document 4_2024-08-26 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2024-08-21' --> 'data\processed_data\META\4_2024-08-21.md'
Converted 'data\edgar_documents\META\4_2024-08-22' --> 'data\processed_data\META\4_2024-08-22.md'


2025-11-14 17:16:55,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,395 - INFO - Going to convert document batch...
2025-11-14 17:16:55,396 - INFO - Processing document 4_2024-08-27
2025-11-14 17:16:55,422 - INFO - Finished converting document 4_2024-08-27 in 0.06 sec.
2025-11-14 17:16:55,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,491 - INFO - Going to convert document batch...
2025-11-14 17:16:55,492 - INFO - Processing document 4_2024-08-28
2025-11-14 17:16:55,533 - INFO - Finished converting document 4_2024-08-28 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-08-26' --> 'data\processed_data\META\4_2024-08-26.md'
Converted 'data\edgar_documents\META\4_2024-08-27' --> 'data\processed_data\META\4_2024-08-27.md'


2025-11-14 17:16:55,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,602 - INFO - Going to convert document batch...
2025-11-14 17:16:55,603 - INFO - Processing document 4_2024-08-29
2025-11-14 17:16:55,648 - INFO - Finished converting document 4_2024-08-29 in 0.06 sec.
2025-11-14 17:16:55,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,719 - INFO - Going to convert document batch...
2025-11-14 17:16:55,720 - INFO - Processing document 4_2024-09-03
2025-11-14 17:16:55,763 - INFO - Finished converting document 4_2024-09-03 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-08-28' --> 'data\processed_data\META\4_2024-08-28.md'
Converted 'data\edgar_documents\META\4_2024-08-29' --> 'data\processed_data\META\4_2024-08-29.md'


2025-11-14 17:16:55,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,823 - INFO - Going to convert document batch...
2025-11-14 17:16:55,825 - INFO - Processing document 4_2024-09-04
2025-11-14 17:16:55,863 - INFO - Finished converting document 4_2024-09-04 in 0.06 sec.
2025-11-14 17:16:55,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,914 - INFO - Going to convert document batch...
2025-11-14 17:16:55,915 - INFO - Processing document 4_2024-09-05
2025-11-14 17:16:55,933 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 17:16:55,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:55,975 - INFO - Going to convert document batch...
2025-11-14 17:16:55,976 - INFO - Processing document 4_2024-09-10
2025-11-14 17:16:55,998 - INFO - Finished converting document 4_2024-09-10 in 0.05 sec.


Converted 'data\edgar_documents\META\4_2024-09-03' --> 'data\processed_data\META\4_2024-09-03.md'
Converted 'data\edgar_documents\META\4_2024-09-04' --> 'data\processed_data\META\4_2024-09-04.md'
Converted 'data\edgar_documents\META\4_2024-09-05' --> 'data\processed_data\META\4_2024-09-05.md'


2025-11-14 17:16:56,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,042 - INFO - Going to convert document batch...
2025-11-14 17:16:56,043 - INFO - Processing document 4_2024-09-12
2025-11-14 17:16:56,060 - INFO - Finished converting document 4_2024-09-12 in 0.05 sec.
2025-11-14 17:16:56,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,122 - INFO - Going to convert document batch...
2025-11-14 17:16:56,123 - INFO - Processing document 4_2024-09-17
2025-11-14 17:16:56,142 - INFO - Finished converting document 4_2024-09-17 in 0.06 sec.
2025-11-14 17:16:56,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,208 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-09-10' --> 'data\processed_data\META\4_2024-09-10.md'
Converted 'data\edgar_documents\META\4_2024-09-12' --> 'data\processed_data\META\4_2024-09-12.md'
Converted 'data\edgar_documents\META\4_2024-09-17' --> 'data\processed_data\META\4_2024-09-17.md'


2025-11-14 17:16:56,209 - INFO - Processing document 4_2024-09-19
2025-11-14 17:16:56,225 - INFO - Finished converting document 4_2024-09-19 in 0.06 sec.
2025-11-14 17:16:56,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,269 - INFO - Going to convert document batch...
2025-11-14 17:16:56,270 - INFO - Processing document 4_2024-09-23
2025-11-14 17:16:56,292 - INFO - Finished converting document 4_2024-09-23 in 0.05 sec.
2025-11-14 17:16:56,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,336 - INFO - Going to convert document batch...
2025-11-14 17:16:56,337 - INFO - Processing document 4_2024-09-24
2025-11-14 17:16:56,359 - INFO - Finished converting document 4_2024-09-24 in 0.05 sec.
2025-11-14 17:16:56,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,400 - INFO - Going to convert document batch...
2025-11-14 17:16:56,401 - INFO - Processing document 4_2024-09-25
2025-11-14 17:16:56,420 - IN

Converted 'data\edgar_documents\META\4_2024-09-19' --> 'data\processed_data\META\4_2024-09-19.md'
Converted 'data\edgar_documents\META\4_2024-09-23' --> 'data\processed_data\META\4_2024-09-23.md'
Converted 'data\edgar_documents\META\4_2024-09-24' --> 'data\processed_data\META\4_2024-09-24.md'
Converted 'data\edgar_documents\META\4_2024-09-25' --> 'data\processed_data\META\4_2024-09-25.md'


2025-11-14 17:16:56,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,480 - INFO - Going to convert document batch...
2025-11-14 17:16:56,481 - INFO - Processing document 4_2024-09-26
2025-11-14 17:16:56,498 - INFO - Finished converting document 4_2024-09-26 in 0.06 sec.
2025-11-14 17:16:56,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,541 - INFO - Going to convert document batch...
2025-11-14 17:16:56,542 - INFO - Processing document 4_2024-10-01
2025-11-14 17:16:56,563 - INFO - Finished converting document 4_2024-10-01 in 0.05 sec.
2025-11-14 17:16:56,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,625 - INFO - Going to convert document batch...
2025-11-14 17:16:56,626 - INFO - Processing document 4_2024-10-03
2025-11-14 17:16:56,644 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 17:16:56,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2024-09-26' --> 'data\processed_data\META\4_2024-09-26.md'
Converted 'data\edgar_documents\META\4_2024-10-01' --> 'data\processed_data\META\4_2024-10-01.md'
Converted 'data\edgar_documents\META\4_2024-10-03' --> 'data\processed_data\META\4_2024-10-03.md'


2025-11-14 17:16:56,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,753 - INFO - Going to convert document batch...
2025-11-14 17:16:56,754 - INFO - Processing document 4_2024-10-09
2025-11-14 17:16:56,790 - INFO - Finished converting document 4_2024-10-09 in 0.05 sec.
2025-11-14 17:16:56,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:56,844 - INFO - Going to convert document batch...
2025-11-14 17:16:56,845 - INFO - Processing document 4_2024-10-10
2025-11-14 17:16:56,863 - INFO - Finished converting document 4_2024-10-10 in 0.05 sec.
2025-11-14 17:16:56,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2024-10-08' --> 'data\processed_data\META\4_2024-10-08.md'
Converted 'data\edgar_documents\META\4_2024-10-09' --> 'data\processed_data\META\4_2024-10-09.md'
Converted 'data\edgar_documents\META\4_2024-10-10' --> 'data\processed_data\META\4_2024-10-10.md'


2025-11-14 17:16:56,943 - INFO - Going to convert document batch...
2025-11-14 17:16:56,943 - INFO - Processing document 4_2024-10-15
2025-11-14 17:16:57,179 - INFO - Finished converting document 4_2024-10-15 in 0.27 sec.
2025-11-14 17:16:57,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,222 - INFO - Going to convert document batch...
2025-11-14 17:16:57,223 - INFO - Processing document 4_2024-10-16
2025-11-14 17:16:57,254 - INFO - Finished converting document 4_2024-10-16 in 0.05 sec.
2025-11-14 17:16:57,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,303 - INFO - Going to convert document batch...
2025-11-14 17:16:57,304 - INFO - Processing document 4_2024-10-17
2025-11-14 17:16:57,322 - INFO - Finished converting document 4_2024-10-17 in 0.05 sec.
2025-11-14 17:16:57,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,362 - INFO - Going to convert document batch...
2025-11-14 17:16:57,364 - 

Converted 'data\edgar_documents\META\4_2024-10-15' --> 'data\processed_data\META\4_2024-10-15.md'
Converted 'data\edgar_documents\META\4_2024-10-16' --> 'data\processed_data\META\4_2024-10-16.md'
Converted 'data\edgar_documents\META\4_2024-10-17' --> 'data\processed_data\META\4_2024-10-17.md'


2025-11-14 17:16:57,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,427 - INFO - Going to convert document batch...
2025-11-14 17:16:57,428 - INFO - Processing document 4_2024-10-24
2025-11-14 17:16:57,446 - INFO - Finished converting document 4_2024-10-24 in 0.03 sec.
2025-11-14 17:16:57,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,489 - INFO - Going to convert document batch...
2025-11-14 17:16:57,490 - INFO - Processing document 4_2024-10-29
2025-11-14 17:16:57,531 - INFO - Finished converting document 4_2024-10-29 in 0.06 sec.
2025-11-14 17:16:57,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,598 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2024-10-22' --> 'data\processed_data\META\4_2024-10-22.md'
Converted 'data\edgar_documents\META\4_2024-10-24' --> 'data\processed_data\META\4_2024-10-24.md'
Converted 'data\edgar_documents\META\4_2024-10-29' --> 'data\processed_data\META\4_2024-10-29.md'


2025-11-14 17:16:57,599 - INFO - Processing document 4_2024-10-30
2025-11-14 17:16:57,623 - INFO - Finished converting document 4_2024-10-30 in 0.06 sec.
2025-11-14 17:16:57,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,675 - INFO - Going to convert document batch...
2025-11-14 17:16:57,676 - INFO - Processing document 4_2024-10-31
2025-11-14 17:16:57,704 - INFO - Finished converting document 4_2024-10-31 in 0.05 sec.
2025-11-14 17:16:57,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,780 - INFO - Going to convert document batch...
2025-11-14 17:16:57,781 - INFO - Processing document 4_2024-11-01
2025-11-14 17:16:57,812 - INFO - Finished converting document 4_2024-11-01 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-10-30' --> 'data\processed_data\META\4_2024-10-30.md'
Converted 'data\edgar_documents\META\4_2024-10-31' --> 'data\processed_data\META\4_2024-10-31.md'
Converted 'data\edgar_documents\META\4_2024-11-01' --> 'data\processed_data\META\4_2024-11-01.md'


2025-11-14 17:16:57,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:57,897 - INFO - Going to convert document batch...
2025-11-14 17:16:57,899 - INFO - Processing document 4_2024-11-05
2025-11-14 17:16:57,962 - INFO - Finished converting document 4_2024-11-05 in 0.11 sec.
2025-11-14 17:16:58,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,041 - INFO - Going to convert document batch...
2025-11-14 17:16:58,042 - INFO - Processing document 4_2024-11-07
2025-11-14 17:16:58,066 - INFO - Finished converting document 4_2024-11-07 in 0.05 sec.
2025-11-14 17:16:58,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,126 - INFO - Going to convert document batch...
2025-11-14 17:16:58,127 - INFO - Processing document 4_2024-11-19
2025-11-14 17:16:58,167 - INFO - Finished converting document 4_2024-11-19 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-11-05' --> 'data\processed_data\META\4_2024-11-05.md'
Converted 'data\edgar_documents\META\4_2024-11-07' --> 'data\processed_data\META\4_2024-11-07.md'


2025-11-14 17:16:58,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,224 - INFO - Going to convert document batch...
2025-11-14 17:16:58,225 - INFO - Processing document 4_2024-11-21
2025-11-14 17:16:58,243 - INFO - Finished converting document 4_2024-11-21 in 0.03 sec.
2025-11-14 17:16:58,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,290 - INFO - Going to convert document batch...
2025-11-14 17:16:58,291 - INFO - Processing document 4_2024-11-26
2025-11-14 17:16:58,313 - INFO - Finished converting document 4_2024-11-26 in 0.05 sec.
2025-11-14 17:16:58,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,361 - INFO - Going to convert document batch...
2025-11-14 17:16:58,362 - INFO - Processing document 4_2024-11-27
2025-11-14 17:16:58,380 - INFO - Finished converting document 4_2024-11-27 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2024-11-19' --> 'data\processed_data\META\4_2024-11-19.md'
Converted 'data\edgar_documents\META\4_2024-11-21' --> 'data\processed_data\META\4_2024-11-21.md'
Converted 'data\edgar_documents\META\4_2024-11-26' --> 'data\processed_data\META\4_2024-11-26.md'
Converted 'data\edgar_documents\META\4_2024-11-27' --> 'data\processed_data\META\4_2024-11-27.md'


2025-11-14 17:16:58,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,463 - INFO - Going to convert document batch...
2025-11-14 17:16:58,464 - INFO - Processing document 4_2024-12-04
2025-11-14 17:16:58,548 - INFO - Finished converting document 4_2024-12-04 in 0.14 sec.
2025-11-14 17:16:58,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,627 - INFO - Going to convert document batch...
2025-11-14 17:16:58,628 - INFO - Processing document 4_2024-12-05
2025-11-14 17:16:58,645 - INFO - Finished converting document 4_2024-12-05 in 0.03 sec.
2025-11-14 17:16:58,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,702 - INFO - Going to convert document batch...
2025-11-14 17:16:58,703 - INFO - Processing document 4_2024-12-09
2025-11-14 17:16:58,771 - INFO - Finished converting document 4_2024-12-09 in 0.11 sec.


Converted 'data\edgar_documents\META\4_2024-12-04' --> 'data\processed_data\META\4_2024-12-04.md'
Converted 'data\edgar_documents\META\4_2024-12-05' --> 'data\processed_data\META\4_2024-12-05.md'
Converted 'data\edgar_documents\META\4_2024-12-09' --> 'data\processed_data\META\4_2024-12-09.md'


2025-11-14 17:16:58,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:58,907 - INFO - Going to convert document batch...
2025-11-14 17:16:58,909 - INFO - Processing document 4_2024-12-11
2025-11-14 17:16:59,011 - INFO - Finished converting document 4_2024-12-11 in 0.19 sec.
2025-11-14 17:16:59,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,104 - INFO - Going to convert document batch...
2025-11-14 17:16:59,105 - INFO - Processing document 4_2024-12-12
2025-11-14 17:16:59,123 - INFO - Finished converting document 4_2024-12-12 in 0.05 sec.
2025-11-14 17:16:59,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,195 - INFO - Going to convert document batch...
2025-11-14 17:16:59,196 - INFO - Processing document 4_2024-12-16


Converted 'data\edgar_documents\META\4_2024-12-11' --> 'data\processed_data\META\4_2024-12-11.md'
Converted 'data\edgar_documents\META\4_2024-12-12' --> 'data\processed_data\META\4_2024-12-12.md'


2025-11-14 17:16:59,286 - INFO - Finished converting document 4_2024-12-16 in 0.14 sec.
2025-11-14 17:16:59,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,424 - INFO - Going to convert document batch...
2025-11-14 17:16:59,425 - INFO - Processing document 4_2024-12-18
2025-11-14 17:16:59,508 - INFO - Finished converting document 4_2024-12-18 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2024-12-16' --> 'data\processed_data\META\4_2024-12-16.md'


2025-11-14 17:16:59,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,594 - INFO - Going to convert document batch...
2025-11-14 17:16:59,595 - INFO - Processing document 4_2024-12-19
2025-11-14 17:16:59,614 - INFO - Finished converting document 4_2024-12-19 in 0.05 sec.
2025-11-14 17:16:59,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,673 - INFO - Going to convert document batch...
2025-11-14 17:16:59,674 - INFO - Processing document 4_2024-12-23
2025-11-14 17:16:59,721 - INFO - Finished converting document 4_2024-12-23 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-12-18' --> 'data\processed_data\META\4_2024-12-18.md'
Converted 'data\edgar_documents\META\4_2024-12-19' --> 'data\processed_data\META\4_2024-12-19.md'


2025-11-14 17:16:59,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,817 - INFO - Going to convert document batch...
2025-11-14 17:16:59,819 - INFO - Processing document 4_2024-12-26
2025-11-14 17:16:59,857 - INFO - Finished converting document 4_2024-12-26 in 0.11 sec.
2025-11-14 17:16:59,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:16:59,910 - INFO - Going to convert document batch...
2025-11-14 17:16:59,911 - INFO - Processing document 4_2024-12-30
2025-11-14 17:16:59,954 - INFO - Finished converting document 4_2024-12-30 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2024-12-23' --> 'data\processed_data\META\4_2024-12-23.md'
Converted 'data\edgar_documents\META\4_2024-12-26' --> 'data\processed_data\META\4_2024-12-26.md'


2025-11-14 17:17:00,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:00,011 - INFO - Going to convert document batch...
2025-11-14 17:17:00,012 - INFO - Processing document 4_2025-01-02
2025-11-14 17:17:00,036 - INFO - Finished converting document 4_2025-01-02 in 0.05 sec.
2025-11-14 17:17:00,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:00,117 - INFO - Going to convert document batch...
2025-11-14 17:17:00,119 - INFO - Processing document 4_2025-01-06


Converted 'data\edgar_documents\META\4_2024-12-30' --> 'data\processed_data\META\4_2024-12-30.md'
Converted 'data\edgar_documents\META\4_2025-01-02' --> 'data\processed_data\META\4_2025-01-02.md'


2025-11-14 17:17:00,195 - INFO - Finished converting document 4_2025-01-06 in 0.14 sec.
2025-11-14 17:17:00,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-01-06' --> 'data\processed_data\META\4_2025-01-06.md'


2025-11-14 17:17:00,504 - INFO - Going to convert document batch...
2025-11-14 17:17:00,505 - INFO - Processing document 4_2025-01-08
2025-11-14 17:17:00,580 - INFO - Finished converting document 4_2025-01-08 in 0.33 sec.
2025-11-14 17:17:00,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:00,660 - INFO - Going to convert document batch...
2025-11-14 17:17:00,660 - INFO - Processing document 4_2025-01-10
2025-11-14 17:17:00,677 - INFO - Finished converting document 4_2025-01-10 in 0.03 sec.
2025-11-14 17:17:00,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:00,738 - INFO - Going to convert document batch...
2025-11-14 17:17:00,739 - INFO - Processing document 4_2025-01-13
2025-11-14 17:17:00,820 - INFO - Finished converting document 4_2025-01-13 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2025-01-08' --> 'data\processed_data\META\4_2025-01-08.md'
Converted 'data\edgar_documents\META\4_2025-01-10' --> 'data\processed_data\META\4_2025-01-10.md'


2025-11-14 17:17:00,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:00,975 - INFO - Going to convert document batch...
2025-11-14 17:17:00,976 - INFO - Processing document 4_2025-01-15
2025-11-14 17:17:01,070 - INFO - Finished converting document 4_2025-01-15 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2025-01-13' --> 'data\processed_data\META\4_2025-01-13.md'


2025-11-14 17:17:01,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:01,166 - INFO - Going to convert document batch...
2025-11-14 17:17:01,168 - INFO - Processing document 4_2025-01-16
2025-11-14 17:17:01,185 - INFO - Finished converting document 4_2025-01-16 in 0.05 sec.
2025-11-14 17:17:01,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:01,250 - INFO - Going to convert document batch...
2025-11-14 17:17:01,251 - INFO - Processing document 4_2025-01-17
2025-11-14 17:17:01,280 - INFO - Finished converting document 4_2025-01-17 in 0.08 sec.
2025-11-14 17:17:01,329 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-01-15' --> 'data\processed_data\META\4_2025-01-15.md'
Converted 'data\edgar_documents\META\4_2025-01-16' --> 'data\processed_data\META\4_2025-01-16.md'
Converted 'data\edgar_documents\META\4_2025-01-17' --> 'data\processed_data\META\4_2025-01-17.md'


2025-11-14 17:17:01,368 - INFO - Going to convert document batch...
2025-11-14 17:17:01,369 - INFO - Processing document 4_2025-01-21
2025-11-14 17:17:01,471 - INFO - Finished converting document 4_2025-01-21 in 0.17 sec.


Converted 'data\edgar_documents\META\4_2025-01-21' --> 'data\processed_data\META\4_2025-01-21.md'


2025-11-14 17:17:01,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:01,790 - INFO - Going to convert document batch...
2025-11-14 17:17:01,791 - INFO - Processing document 4_2025-01-22
2025-11-14 17:17:01,874 - INFO - Finished converting document 4_2025-01-22 in 0.34 sec.
2025-11-14 17:17:01,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:01,959 - INFO - Going to convert document batch...
2025-11-14 17:17:01,960 - INFO - Processing document 4_2025-01-23
2025-11-14 17:17:01,982 - INFO - Finished converting document 4_2025-01-23 in 0.05 sec.
2025-11-14 17:17:02,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:02,064 - INFO - Going to convert document batch...
2025-11-14 17:17:02,065 - INFO - Processing document 4_2025-01-27


Converted 'data\edgar_documents\META\4_2025-01-22' --> 'data\processed_data\META\4_2025-01-22.md'
Converted 'data\edgar_documents\META\4_2025-01-23' --> 'data\processed_data\META\4_2025-01-23.md'


2025-11-14 17:17:02,155 - INFO - Finished converting document 4_2025-01-27 in 0.16 sec.
2025-11-14 17:17:02,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:02,276 - INFO - Going to convert document batch...
2025-11-14 17:17:02,277 - INFO - Processing document 4_2025-01-29
2025-11-14 17:17:02,403 - INFO - Finished converting document 4_2025-01-29 in 0.17 sec.


Converted 'data\edgar_documents\META\4_2025-01-27' --> 'data\processed_data\META\4_2025-01-27.md'


2025-11-14 17:17:02,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:02,497 - INFO - Going to convert document batch...
2025-11-14 17:17:02,500 - INFO - Processing document 4_2025-01-30
2025-11-14 17:17:02,532 - INFO - Finished converting document 4_2025-01-30 in 0.06 sec.
2025-11-14 17:17:02,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:02,601 - INFO - Going to convert document batch...
2025-11-14 17:17:02,603 - INFO - Processing document 4_2025-02-03
2025-11-14 17:17:02,673 - INFO - Finished converting document 4_2025-02-03 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2025-01-29' --> 'data\processed_data\META\4_2025-01-29.md'
Converted 'data\edgar_documents\META\4_2025-01-30' --> 'data\processed_data\META\4_2025-01-30.md'


2025-11-14 17:17:02,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:02,787 - INFO - Going to convert document batch...
2025-11-14 17:17:02,788 - INFO - Processing document 4_2025-02-05
2025-11-14 17:17:02,862 - INFO - Finished converting document 4_2025-02-05 in 0.12 sec.
2025-11-14 17:17:02,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-02-03' --> 'data\processed_data\META\4_2025-02-03.md'
Converted 'data\edgar_documents\META\4_2025-02-05' --> 'data\processed_data\META\4_2025-02-05.md'


2025-11-14 17:17:02,933 - INFO - Going to convert document batch...
2025-11-14 17:17:02,934 - INFO - Processing document 4_2025-02-06
2025-11-14 17:17:02,952 - INFO - Finished converting document 4_2025-02-06 in 0.05 sec.
2025-11-14 17:17:02,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:03,020 - INFO - Going to convert document batch...
2025-11-14 17:17:03,021 - INFO - Processing document 4_2025-02-10
2025-11-14 17:17:03,117 - INFO - Finished converting document 4_2025-02-10 in 0.14 sec.


Converted 'data\edgar_documents\META\4_2025-02-06' --> 'data\processed_data\META\4_2025-02-06.md'


2025-11-14 17:17:03,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:03,227 - INFO - Going to convert document batch...
2025-11-14 17:17:03,228 - INFO - Processing document 4_2025-02-12
2025-11-14 17:17:03,292 - INFO - Finished converting document 4_2025-02-12 in 0.11 sec.
2025-11-14 17:17:03,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:03,357 - INFO - Going to convert document batch...
2025-11-14 17:17:03,357 - INFO - Processing document 4_2025-02-13


Converted 'data\edgar_documents\META\4_2025-02-10' --> 'data\processed_data\META\4_2025-02-10.md'
Converted 'data\edgar_documents\META\4_2025-02-12' --> 'data\processed_data\META\4_2025-02-12.md'


2025-11-14 17:17:03,375 - INFO - Finished converting document 4_2025-02-13 in 0.03 sec.
2025-11-14 17:17:03,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-02-13' --> 'data\processed_data\META\4_2025-02-13.md'


2025-11-14 17:17:03,665 - INFO - Going to convert document batch...
2025-11-14 17:17:03,666 - INFO - Processing document 4_2025-02-18
2025-11-14 17:17:03,733 - INFO - Finished converting document 4_2025-02-18 in 0.34 sec.
2025-11-14 17:17:03,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:03,842 - INFO - Going to convert document batch...
2025-11-14 17:17:03,843 - INFO - Processing document 4_2025-02-19
2025-11-14 17:17:03,893 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 17:17:03,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:03,971 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-02-18' --> 'data\processed_data\META\4_2025-02-18.md'
Converted 'data\edgar_documents\META\4_2025-02-19' --> 'data\processed_data\META\4_2025-02-19.md'


2025-11-14 17:17:03,972 - INFO - Processing document 4_2025-02-24
2025-11-14 17:17:04,017 - INFO - Finished converting document 4_2025-02-24 in 0.08 sec.
2025-11-14 17:17:04,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,079 - INFO - Going to convert document batch...
2025-11-14 17:17:04,080 - INFO - Processing document 4_2025-02-26
2025-11-14 17:17:04,101 - INFO - Finished converting document 4_2025-02-26 in 0.03 sec.
2025-11-14 17:17:04,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,140 - INFO - Going to convert document batch...
2025-11-14 17:17:04,141 - INFO - Processing document 4_2025-02-27
2025-11-14 17:17:04,159 - INFO - Finished converting document 4_2025-02-27 in 0.03 sec.
2025-11-14 17:17:04,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,207 - INFO - Going to convert document batch...
2025-11-14 17:17:04,208 - INFO - Processing document 4_2025-02-28
2025-11-14 17:17:04,253 - IN

Converted 'data\edgar_documents\META\4_2025-02-24' --> 'data\processed_data\META\4_2025-02-24.md'
Converted 'data\edgar_documents\META\4_2025-02-26' --> 'data\processed_data\META\4_2025-02-26.md'
Converted 'data\edgar_documents\META\4_2025-02-27' --> 'data\processed_data\META\4_2025-02-27.md'


2025-11-14 17:17:04,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,329 - INFO - Going to convert document batch...
2025-11-14 17:17:04,330 - INFO - Processing document 4_2025-03-03
2025-11-14 17:17:04,414 - INFO - Finished converting document 4_2025-03-03 in 0.12 sec.


Converted 'data\edgar_documents\META\4_2025-02-28' --> 'data\processed_data\META\4_2025-02-28.md'


2025-11-14 17:17:04,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,507 - INFO - Going to convert document batch...
2025-11-14 17:17:04,508 - INFO - Processing document 4_2025-03-04
2025-11-14 17:17:04,554 - INFO - Finished converting document 4_2025-03-04 in 0.08 sec.
2025-11-14 17:17:04,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,647 - INFO - Going to convert document batch...
2025-11-14 17:17:04,648 - INFO - Processing document 4_2025-03-05
2025-11-14 17:17:04,670 - INFO - Finished converting document 4_2025-03-05 in 0.06 sec.


Converted 'data\edgar_documents\META\4_2025-03-03' --> 'data\processed_data\META\4_2025-03-03.md'
Converted 'data\edgar_documents\META\4_2025-03-04' --> 'data\processed_data\META\4_2025-03-04.md'


2025-11-14 17:17:04,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,711 - INFO - Going to convert document batch...
2025-11-14 17:17:04,712 - INFO - Processing document 4_2025-03-06
2025-11-14 17:17:04,732 - INFO - Finished converting document 4_2025-03-06 in 0.05 sec.
2025-11-14 17:17:04,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,778 - INFO - Going to convert document batch...
2025-11-14 17:17:04,779 - INFO - Processing document 4_2025-03-12
2025-11-14 17:17:04,803 - INFO - Finished converting document 4_2025-03-12 in 0.05 sec.
2025-11-14 17:17:04,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,845 - INFO - Going to convert document batch...
2025-11-14 17:17:04,845 - INFO - Processing document 4_2025-03-13
2025-11-14 17:17:04,863 - INFO - Finished converting document 4_2025-03-13 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2025-03-05' --> 'data\processed_data\META\4_2025-03-05.md'
Converted 'data\edgar_documents\META\4_2025-03-06' --> 'data\processed_data\META\4_2025-03-06.md'
Converted 'data\edgar_documents\META\4_2025-03-12' --> 'data\processed_data\META\4_2025-03-12.md'


2025-11-14 17:17:04,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,902 - INFO - Going to convert document batch...
2025-11-14 17:17:04,903 - INFO - Processing document 4_2025-03-19
2025-11-14 17:17:04,926 - INFO - Finished converting document 4_2025-03-19 in 0.05 sec.
2025-11-14 17:17:04,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:04,971 - INFO - Going to convert document batch...
2025-11-14 17:17:04,972 - INFO - Processing document 4_2025-03-20
2025-11-14 17:17:04,993 - INFO - Finished converting document 4_2025-03-20 in 0.03 sec.
2025-11-14 17:17:05,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,029 - INFO - Going to convert document batch...
2025-11-14 17:17:05,030 - INFO - Processing document 4_2025-03-24
2025-11-14 17:17:05,050 - INFO - Finished converting document 4_2025-03-24 in 0.03 sec.
2025-11-14 17:17:05,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-03-13' --> 'data\processed_data\META\4_2025-03-13.md'
Converted 'data\edgar_documents\META\4_2025-03-19' --> 'data\processed_data\META\4_2025-03-19.md'
Converted 'data\edgar_documents\META\4_2025-03-20' --> 'data\processed_data\META\4_2025-03-20.md'
Converted 'data\edgar_documents\META\4_2025-03-24' --> 'data\processed_data\META\4_2025-03-24.md'


2025-11-14 17:17:05,092 - INFO - Going to convert document batch...
2025-11-14 17:17:05,093 - INFO - Processing document 4_2025-03-26
2025-11-14 17:17:05,115 - INFO - Finished converting document 4_2025-03-26 in 0.05 sec.
2025-11-14 17:17:05,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,173 - INFO - Going to convert document batch...
2025-11-14 17:17:05,173 - INFO - Processing document 4_2025-03-27
2025-11-14 17:17:05,190 - INFO - Finished converting document 4_2025-03-27 in 0.05 sec.
2025-11-14 17:17:05,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,230 - INFO - Going to convert document batch...
2025-11-14 17:17:05,231 - INFO - Processing document 4_2025-04-02
2025-11-14 17:17:05,253 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 17:17:05,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,293 - INFO - Going to convert document batch...
2025-11-14 17:17:05,294 - 

Converted 'data\edgar_documents\META\4_2025-03-26' --> 'data\processed_data\META\4_2025-03-26.md'
Converted 'data\edgar_documents\META\4_2025-03-27' --> 'data\processed_data\META\4_2025-03-27.md'
Converted 'data\edgar_documents\META\4_2025-04-02' --> 'data\processed_data\META\4_2025-04-02.md'
Converted 'data\edgar_documents\META\4_2025-04-03' --> 'data\processed_data\META\4_2025-04-03.md'


2025-11-14 17:17:05,353 - INFO - Going to convert document batch...
2025-11-14 17:17:05,354 - INFO - Processing document 4_2025-04-09
2025-11-14 17:17:05,377 - INFO - Finished converting document 4_2025-04-09 in 0.05 sec.
2025-11-14 17:17:05,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,439 - INFO - Going to convert document batch...
2025-11-14 17:17:05,440 - INFO - Processing document 4_2025-04-10
2025-11-14 17:17:05,461 - INFO - Finished converting document 4_2025-04-10 in 0.05 sec.
2025-11-14 17:17:05,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,503 - INFO - Going to convert document batch...
2025-11-14 17:17:05,503 - INFO - Processing document 4_2025-04-16
2025-11-14 17:17:05,525 - INFO - Finished converting document 4_2025-04-16 in 0.03 sec.
2025-11-14 17:17:05,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,566 - INFO - Going to convert document batch...
2025-11-14 17:17:05,567 - 

Converted 'data\edgar_documents\META\4_2025-04-09' --> 'data\processed_data\META\4_2025-04-09.md'
Converted 'data\edgar_documents\META\4_2025-04-10' --> 'data\processed_data\META\4_2025-04-10.md'
Converted 'data\edgar_documents\META\4_2025-04-16' --> 'data\processed_data\META\4_2025-04-16.md'


2025-11-14 17:17:05,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,626 - INFO - Going to convert document batch...
2025-11-14 17:17:05,627 - INFO - Processing document 4_2025-04-23
2025-11-14 17:17:05,652 - INFO - Finished converting document 4_2025-04-23 in 0.06 sec.
2025-11-14 17:17:05,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,696 - INFO - Going to convert document batch...
2025-11-14 17:17:05,697 - INFO - Processing document 4_2025-04-24
2025-11-14 17:17:05,732 - INFO - Finished converting document 4_2025-04-24 in 0.06 sec.
2025-11-14 17:17:05,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,784 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-04-17' --> 'data\processed_data\META\4_2025-04-17.md'
Converted 'data\edgar_documents\META\4_2025-04-23' --> 'data\processed_data\META\4_2025-04-23.md'
Converted 'data\edgar_documents\META\4_2025-04-24' --> 'data\processed_data\META\4_2025-04-24.md'


2025-11-14 17:17:05,785 - INFO - Processing document 4_2025-04-30
2025-11-14 17:17:05,808 - INFO - Finished converting document 4_2025-04-30 in 0.05 sec.
2025-11-14 17:17:05,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,854 - INFO - Going to convert document batch...
2025-11-14 17:17:05,855 - INFO - Processing document 4_2025-05-01
2025-11-14 17:17:05,874 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-11-14 17:17:05,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:05,921 - INFO - Going to convert document batch...
2025-11-14 17:17:05,921 - INFO - Processing document 4_2025-05-06
2025-11-14 17:17:05,964 - INFO - Finished converting document 4_2025-05-06 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2025-04-30' --> 'data\processed_data\META\4_2025-04-30.md'
Converted 'data\edgar_documents\META\4_2025-05-01' --> 'data\processed_data\META\4_2025-05-01.md'
Converted 'data\edgar_documents\META\4_2025-05-06' --> 'data\processed_data\META\4_2025-05-06.md'


2025-11-14 17:17:06,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,036 - INFO - Going to convert document batch...
2025-11-14 17:17:06,037 - INFO - Processing document 4_2025-05-07
2025-11-14 17:17:06,061 - INFO - Finished converting document 4_2025-05-07 in 0.06 sec.
2025-11-14 17:17:06,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,103 - INFO - Going to convert document batch...
2025-11-14 17:17:06,104 - INFO - Processing document 4_2025-05-08
2025-11-14 17:17:06,121 - INFO - Finished converting document 4_2025-05-08 in 0.05 sec.
2025-11-14 17:17:06,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,162 - INFO - Going to convert document batch...
2025-11-14 17:17:06,163 - INFO - Processing document 4_2025-05-14
2025-11-14 17:17:06,184 - INFO - Finished converting document 4_2025-05-14 in 0.05 sec.
2025-11-14 17:17:06,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2025-05-07' --> 'data\processed_data\META\4_2025-05-07.md'
Converted 'data\edgar_documents\META\4_2025-05-08' --> 'data\processed_data\META\4_2025-05-08.md'
Converted 'data\edgar_documents\META\4_2025-05-14' --> 'data\processed_data\META\4_2025-05-14.md'
Converted 'data\edgar_documents\META\4_2025-05-15' --> 'data\processed_data\META\4_2025-05-15.md'


2025-11-14 17:17:06,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,319 - INFO - Going to convert document batch...
2025-11-14 17:17:06,319 - INFO - Processing document 4_2025-05-19
2025-11-14 17:17:06,362 - INFO - Finished converting document 4_2025-05-19 in 0.09 sec.
2025-11-14 17:17:06,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,416 - INFO - Going to convert document batch...
2025-11-14 17:17:06,416 - INFO - Processing document 4_2025-05-20
2025-11-14 17:17:06,439 - INFO - Finished converting document 4_2025-05-20 in 0.05 sec.
2025-11-14 17:17:06,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,483 - INFO - Going to convert document batch...
2025-11-14 17:17:06,484 - INFO - Processing document 4_2025-05-21
2025-11-14 17:17:06,505 - INFO - Finished converting document 4_2025-05-21 in 0.05 sec.
2025-11-14 17:17:06,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2025-05-19' --> 'data\processed_data\META\4_2025-05-19.md'
Converted 'data\edgar_documents\META\4_2025-05-20' --> 'data\processed_data\META\4_2025-05-20.md'
Converted 'data\edgar_documents\META\4_2025-05-21' --> 'data\processed_data\META\4_2025-05-21.md'


2025-11-14 17:17:06,779 - INFO - Finished converting document 4_2025-05-22 in 0.25 sec.
2025-11-14 17:17:06,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,828 - INFO - Going to convert document batch...
2025-11-14 17:17:06,828 - INFO - Processing document 4_2025-05-29
2025-11-14 17:17:06,846 - INFO - Finished converting document 4_2025-05-29 in 0.05 sec.
2025-11-14 17:17:06,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,922 - INFO - Going to convert document batch...
2025-11-14 17:17:06,922 - INFO - Processing document 4_2025-06-04
2025-11-14 17:17:06,945 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 17:17:06,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:06,985 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-05-22' --> 'data\processed_data\META\4_2025-05-22.md'
Converted 'data\edgar_documents\META\4_2025-05-29' --> 'data\processed_data\META\4_2025-05-29.md'
Converted 'data\edgar_documents\META\4_2025-06-04' --> 'data\processed_data\META\4_2025-06-04.md'


2025-11-14 17:17:06,987 - INFO - Processing document 4_2025-06-05
2025-11-14 17:17:07,004 - INFO - Finished converting document 4_2025-06-05 in 0.03 sec.
2025-11-14 17:17:07,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,056 - INFO - Going to convert document batch...
2025-11-14 17:17:07,057 - INFO - Processing document 4_2025-06-09
2025-11-14 17:17:07,102 - INFO - Finished converting document 4_2025-06-09 in 0.08 sec.
2025-11-14 17:17:07,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,168 - INFO - Going to convert document batch...
2025-11-14 17:17:07,169 - INFO - Processing document 4_2025-06-11
2025-11-14 17:17:07,219 - INFO - Finished converting document 4_2025-06-11 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2025-06-05' --> 'data\processed_data\META\4_2025-06-05.md'
Converted 'data\edgar_documents\META\4_2025-06-09' --> 'data\processed_data\META\4_2025-06-09.md'


2025-11-14 17:17:07,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,299 - INFO - Going to convert document batch...
2025-11-14 17:17:07,300 - INFO - Processing document 4_2025-06-12
2025-11-14 17:17:07,325 - INFO - Finished converting document 4_2025-06-12 in 0.06 sec.
2025-11-14 17:17:07,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,395 - INFO - Going to convert document batch...
2025-11-14 17:17:07,396 - INFO - Processing document 4_2025-06-18
2025-11-14 17:17:07,436 - INFO - Finished converting document 4_2025-06-18 in 0.08 sec.


Converted 'data\edgar_documents\META\4_2025-06-11' --> 'data\processed_data\META\4_2025-06-11.md'
Converted 'data\edgar_documents\META\4_2025-06-12' --> 'data\processed_data\META\4_2025-06-12.md'


2025-11-14 17:17:07,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,491 - INFO - Going to convert document batch...
2025-11-14 17:17:07,492 - INFO - Processing document 4_2025-06-20
2025-11-14 17:17:07,512 - INFO - Finished converting document 4_2025-06-20 in 0.05 sec.
2025-11-14 17:17:07,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,560 - INFO - Going to convert document batch...
2025-11-14 17:17:07,561 - INFO - Processing document 4_2025-06-23
2025-11-14 17:17:07,601 - INFO - Finished converting document 4_2025-06-23 in 0.06 sec.
2025-11-14 17:17:07,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,671 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-06-18' --> 'data\processed_data\META\4_2025-06-18.md'
Converted 'data\edgar_documents\META\4_2025-06-20' --> 'data\processed_data\META\4_2025-06-20.md'
Converted 'data\edgar_documents\META\4_2025-06-23' --> 'data\processed_data\META\4_2025-06-23.md'


2025-11-14 17:17:07,672 - INFO - Processing document 4_2025-06-25
2025-11-14 17:17:07,729 - INFO - Finished converting document 4_2025-06-25 in 0.09 sec.
2025-11-14 17:17:07,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,796 - INFO - Going to convert document batch...
2025-11-14 17:17:07,796 - INFO - Processing document 4_2025-06-26
2025-11-14 17:17:07,815 - INFO - Finished converting document 4_2025-06-26 in 0.03 sec.
2025-11-14 17:17:07,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:07,871 - INFO - Going to convert document batch...
2025-11-14 17:17:07,872 - INFO - Processing document 4_2025-06-30
2025-11-14 17:17:07,923 - INFO - Finished converting document 4_2025-06-30 in 0.09 sec.


Converted 'data\edgar_documents\META\4_2025-06-25' --> 'data\processed_data\META\4_2025-06-25.md'
Converted 'data\edgar_documents\META\4_2025-06-26' --> 'data\processed_data\META\4_2025-06-26.md'
Converted 'data\edgar_documents\META\4_2025-06-30' --> 'data\processed_data\META\4_2025-06-30.md'


2025-11-14 17:17:07,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,020 - INFO - Going to convert document batch...
2025-11-14 17:17:08,021 - INFO - Processing document 4_2025-07-02
2025-11-14 17:17:08,096 - INFO - Finished converting document 4_2025-07-02 in 0.12 sec.
2025-11-14 17:17:08,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,178 - INFO - Going to convert document batch...
2025-11-14 17:17:08,178 - INFO - Processing document 4_2025-07-03
2025-11-14 17:17:08,198 - INFO - Finished converting document 4_2025-07-03 in 0.06 sec.
2025-11-14 17:17:08,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,238 - INFO - Going to convert document batch...
2025-11-14 17:17:08,239 - INFO - Processing document 4_2025-07-09
2025-11-14 17:17:08,262 - INFO - Finished converting document 4_2025-07-09 in 0.05 sec.
2025-11-14 17:17:08,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\META\4_2025-07-02' --> 'data\processed_data\META\4_2025-07-02.md'
Converted 'data\edgar_documents\META\4_2025-07-03' --> 'data\processed_data\META\4_2025-07-03.md'
Converted 'data\edgar_documents\META\4_2025-07-09' --> 'data\processed_data\META\4_2025-07-09.md'


2025-11-14 17:17:08,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,362 - INFO - Going to convert document batch...
2025-11-14 17:17:08,363 - INFO - Processing document 4_2025-07-16
2025-11-14 17:17:08,391 - INFO - Finished converting document 4_2025-07-16 in 0.05 sec.
2025-11-14 17:17:08,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,449 - INFO - Going to convert document batch...
2025-11-14 17:17:08,450 - INFO - Processing document 4_2025-07-17
2025-11-14 17:17:08,467 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 17:17:08,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,507 - INFO - Going to convert document batch...
2025-11-14 17:17:08,509 - INFO - Processing document 4_2025-07-23
2025-11-14 17:17:08,531 - INFO - Finished converting document 4_2025-07-23 in 0.05 sec.


Converted 'data\edgar_documents\META\4_2025-07-10' --> 'data\processed_data\META\4_2025-07-10.md'
Converted 'data\edgar_documents\META\4_2025-07-16' --> 'data\processed_data\META\4_2025-07-16.md'
Converted 'data\edgar_documents\META\4_2025-07-17' --> 'data\processed_data\META\4_2025-07-17.md'


2025-11-14 17:17:08,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,573 - INFO - Going to convert document batch...
2025-11-14 17:17:08,574 - INFO - Processing document 4_2025-07-24
2025-11-14 17:17:08,592 - INFO - Finished converting document 4_2025-07-24 in 0.05 sec.
2025-11-14 17:17:08,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,633 - INFO - Going to convert document batch...
2025-11-14 17:17:08,634 - INFO - Processing document 4_2025-07-30
2025-11-14 17:17:08,659 - INFO - Finished converting document 4_2025-07-30 in 0.05 sec.
2025-11-14 17:17:08,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,715 - INFO - Going to convert document batch...
2025-11-14 17:17:08,716 - INFO - Processing document 4_2025-07-31
2025-11-14 17:17:08,732 - INFO - Finished converting document 4_2025-07-31 in 0.06 sec.


Converted 'data\edgar_documents\META\4_2025-07-23' --> 'data\processed_data\META\4_2025-07-23.md'
Converted 'data\edgar_documents\META\4_2025-07-24' --> 'data\processed_data\META\4_2025-07-24.md'
Converted 'data\edgar_documents\META\4_2025-07-30' --> 'data\processed_data\META\4_2025-07-30.md'


2025-11-14 17:17:08,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:08,793 - INFO - Going to convert document batch...
2025-11-14 17:17:08,794 - INFO - Processing document 4_2025-08-04
2025-11-14 17:17:08,866 - INFO - Finished converting document 4_2025-08-04 in 0.11 sec.
2025-11-14 17:17:08,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-07-31' --> 'data\processed_data\META\4_2025-07-31.md'
Converted 'data\edgar_documents\META\4_2025-08-04' --> 'data\processed_data\META\4_2025-08-04.md'


2025-11-14 17:17:08,960 - INFO - Going to convert document batch...
2025-11-14 17:17:08,960 - INFO - Processing document 4_2025-08-05
2025-11-14 17:17:08,988 - INFO - Finished converting document 4_2025-08-05 in 0.05 sec.
2025-11-14 17:17:09,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,050 - INFO - Going to convert document batch...
2025-11-14 17:17:09,051 - INFO - Processing document 4_2025-08-06
2025-11-14 17:17:09,115 - INFO - Finished converting document 4_2025-08-06 in 0.09 sec.
2025-11-14 17:17:09,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,189 - INFO - Going to convert document batch...
2025-11-14 17:17:09,190 - INFO - Processing document 4_2025-08-07
2025-11-14 17:17:09,208 - INFO - Finished converting document 4_2025-08-07 in 0.03 sec.


Converted 'data\edgar_documents\META\4_2025-08-05' --> 'data\processed_data\META\4_2025-08-05.md'
Converted 'data\edgar_documents\META\4_2025-08-06' --> 'data\processed_data\META\4_2025-08-06.md'


2025-11-14 17:17:09,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,253 - INFO - Going to convert document batch...
2025-11-14 17:17:09,253 - INFO - Processing document 4_2025-08-08
2025-11-14 17:17:09,287 - INFO - Finished converting document 4_2025-08-08 in 0.05 sec.
2025-11-14 17:17:09,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,386 - INFO - Going to convert document batch...
2025-11-14 17:17:09,387 - INFO - Processing document 4_2025-08-11


Converted 'data\edgar_documents\META\4_2025-08-07' --> 'data\processed_data\META\4_2025-08-07.md'
Converted 'data\edgar_documents\META\4_2025-08-08' --> 'data\processed_data\META\4_2025-08-08.md'


2025-11-14 17:17:09,458 - INFO - Finished converting document 4_2025-08-11 in 0.12 sec.
2025-11-14 17:17:09,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,554 - INFO - Going to convert document batch...
2025-11-14 17:17:09,555 - INFO - Processing document 4_2025-08-13
2025-11-14 17:17:09,621 - INFO - Finished converting document 4_2025-08-13 in 0.11 sec.
2025-11-14 17:17:09,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,704 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-08-11' --> 'data\processed_data\META\4_2025-08-11.md'
Converted 'data\edgar_documents\META\4_2025-08-13' --> 'data\processed_data\META\4_2025-08-13.md'


2025-11-14 17:17:09,705 - INFO - Processing document 4_2025-08-19
2025-11-14 17:17:09,725 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 17:17:09,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,771 - INFO - Going to convert document batch...
2025-11-14 17:17:09,772 - INFO - Processing document 4_2025-08-27
2025-11-14 17:17:09,797 - INFO - Finished converting document 4_2025-08-27 in 0.05 sec.
2025-11-14 17:17:09,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,859 - INFO - Going to convert document batch...
2025-11-14 17:17:09,860 - INFO - Processing document 4_2025-08-28
2025-11-14 17:17:09,879 - INFO - Finished converting document 4_2025-08-28 in 0.06 sec.
2025-11-14 17:17:09,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:09,918 - INFO - Going to convert document batch...
2025-11-14 17:17:09,919 - INFO - Processing document 4_2025-09-04


Converted 'data\edgar_documents\META\4_2025-08-19' --> 'data\processed_data\META\4_2025-08-19.md'
Converted 'data\edgar_documents\META\4_2025-08-27' --> 'data\processed_data\META\4_2025-08-27.md'
Converted 'data\edgar_documents\META\4_2025-08-28' --> 'data\processed_data\META\4_2025-08-28.md'


2025-11-14 17:17:10,139 - INFO - Finished converting document 4_2025-09-04 in 0.25 sec.
2025-11-14 17:17:10,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,186 - INFO - Going to convert document batch...
2025-11-14 17:17:10,186 - INFO - Processing document 4_2025-09-10
2025-11-14 17:17:10,208 - INFO - Finished converting document 4_2025-09-10 in 0.05 sec.
2025-11-14 17:17:10,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,248 - INFO - Going to convert document batch...
2025-11-14 17:17:10,248 - INFO - Processing document 4_2025-09-11
2025-11-14 17:17:10,267 - INFO - Finished converting document 4_2025-09-11 in 0.03 sec.
2025-11-14 17:17:10,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,307 - INFO - Going to convert document batch...
2025-11-14 17:17:10,307 - INFO - Processing document 4_2025-09-17
2025-11-14 17:17:10,329 - INFO - Finished converting document 4_2025-09-17 in 0.05 sec.
2025-1

Converted 'data\edgar_documents\META\4_2025-09-04' --> 'data\processed_data\META\4_2025-09-04.md'
Converted 'data\edgar_documents\META\4_2025-09-10' --> 'data\processed_data\META\4_2025-09-10.md'
Converted 'data\edgar_documents\META\4_2025-09-11' --> 'data\processed_data\META\4_2025-09-11.md'
Converted 'data\edgar_documents\META\4_2025-09-17' --> 'data\processed_data\META\4_2025-09-17.md'


2025-11-14 17:17:10,370 - INFO - Going to convert document batch...
2025-11-14 17:17:10,371 - INFO - Processing document 4_2025-09-18
2025-11-14 17:17:10,388 - INFO - Finished converting document 4_2025-09-18 in 0.05 sec.
2025-11-14 17:17:10,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,430 - INFO - Going to convert document batch...
2025-11-14 17:17:10,431 - INFO - Processing document 4_2025-09-24
2025-11-14 17:17:10,455 - INFO - Finished converting document 4_2025-09-24 in 0.05 sec.
2025-11-14 17:17:10,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,497 - INFO - Going to convert document batch...
2025-11-14 17:17:10,498 - INFO - Processing document 4_2025-09-25
2025-11-14 17:17:10,516 - INFO - Finished converting document 4_2025-09-25 in 0.05 sec.
2025-11-14 17:17:10,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,554 - INFO - Going to convert document batch...
2025-11-14 17:17:10,554 - 

Converted 'data\edgar_documents\META\4_2025-09-18' --> 'data\processed_data\META\4_2025-09-18.md'
Converted 'data\edgar_documents\META\4_2025-09-24' --> 'data\processed_data\META\4_2025-09-24.md'
Converted 'data\edgar_documents\META\4_2025-09-25' --> 'data\processed_data\META\4_2025-09-25.md'


2025-11-14 17:17:10,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,618 - INFO - Going to convert document batch...
2025-11-14 17:17:10,619 - INFO - Processing document 4_2025-10-02
2025-11-14 17:17:10,637 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 17:17:10,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,681 - INFO - Going to convert document batch...
2025-11-14 17:17:10,682 - INFO - Processing document 4_2025-10-08
2025-11-14 17:17:10,706 - INFO - Finished converting document 4_2025-10-08 in 0.05 sec.
2025-11-14 17:17:10,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,777 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\META\4_2025-10-01' --> 'data\processed_data\META\4_2025-10-01.md'
Converted 'data\edgar_documents\META\4_2025-10-02' --> 'data\processed_data\META\4_2025-10-02.md'
Converted 'data\edgar_documents\META\4_2025-10-08' --> 'data\processed_data\META\4_2025-10-08.md'


2025-11-14 17:17:10,778 - INFO - Processing document 4_2025-10-09
2025-11-14 17:17:10,796 - INFO - Finished converting document 4_2025-10-09 in 0.06 sec.
2025-11-14 17:17:10,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,843 - INFO - Going to convert document batch...
2025-11-14 17:17:10,844 - INFO - Processing document 4_2025-10-15
2025-11-14 17:17:10,867 - INFO - Finished converting document 4_2025-10-15 in 0.05 sec.
2025-11-14 17:17:10,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,909 - INFO - Going to convert document batch...
2025-11-14 17:17:10,910 - INFO - Processing document 4_2025-10-16
2025-11-14 17:17:10,929 - INFO - Finished converting document 4_2025-10-16 in 0.03 sec.
2025-11-14 17:17:10,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:10,969 - INFO - Going to convert document batch...
2025-11-14 17:17:10,970 - INFO - Processing document 4_2025-10-17
2025-11-14 17:17:10,987 - IN

Converted 'data\edgar_documents\META\4_2025-10-09' --> 'data\processed_data\META\4_2025-10-09.md'
Converted 'data\edgar_documents\META\4_2025-10-15' --> 'data\processed_data\META\4_2025-10-15.md'
Converted 'data\edgar_documents\META\4_2025-10-16' --> 'data\processed_data\META\4_2025-10-16.md'


2025-11-14 17:17:11,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,024 - INFO - Going to convert document batch...
2025-11-14 17:17:11,025 - INFO - Processing document 4_2025-10-22
2025-11-14 17:17:11,051 - INFO - Finished converting document 4_2025-10-22 in 0.05 sec.
2025-11-14 17:17:11,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,094 - INFO - Going to convert document batch...
2025-11-14 17:17:11,095 - INFO - Processing document 4_2025-10-23
2025-11-14 17:17:11,112 - INFO - Finished converting document 4_2025-10-23 in 0.03 sec.
2025-11-14 17:17:11,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,177 - INFO - Going to convert document batch...
2025-11-14 17:17:11,177 - INFO - Processing document 4_2025-10-29
2025-11-14 17:17:11,201 - INFO - Finished converting document 4_2025-10-29 in 0.06 sec.


Converted 'data\edgar_documents\META\4_2025-10-17' --> 'data\processed_data\META\4_2025-10-17.md'
Converted 'data\edgar_documents\META\4_2025-10-22' --> 'data\processed_data\META\4_2025-10-22.md'
Converted 'data\edgar_documents\META\4_2025-10-23' --> 'data\processed_data\META\4_2025-10-23.md'


2025-11-14 17:17:11,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,242 - INFO - Going to convert document batch...
2025-11-14 17:17:11,242 - INFO - Processing document 4_2025-10-30
2025-11-14 17:17:11,262 - INFO - Finished converting document 4_2025-10-30 in 0.05 sec.
2025-11-14 17:17:11,304 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:11,305 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17

Converted 'data\edgar_documents\META\4_2025-10-29' --> 'data\processed_data\META\4_2025-10-29.md'
Converted 'data\edgar_documents\META\4_2025-10-30' --> 'data\processed_data\META\4_2025-10-30.md'
Error processing data\edgar_documents\META\4_2025-11-03: File format not allowed: data\edgar_documents\META\4_2025-11-03


2025-11-14 17:17:11,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,441 - INFO - Going to convert document batch...
2025-11-14 17:17:11,442 - INFO - Processing document 4_2025-11-05
2025-11-14 17:17:11,476 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 17:17:11,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,557 - INFO - Going to convert document batch...
2025-11-14 17:17:11,557 - INFO - Processing document 4_2025-11-06
2025-11-14 17:17:11,577 - INFO - Finished converting document 4_2025-11-06 in 0.06 sec.
2025-11-14 17:17:11,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\4_2025-11-04' --> 'data\processed_data\META\4_2025-11-04.md'
Converted 'data\edgar_documents\META\4_2025-11-05' --> 'data\processed_data\META\4_2025-11-05.md'
Converted 'data\edgar_documents\META\4_2025-11-06' --> 'data\processed_data\META\4_2025-11-06.md'


2025-11-14 17:17:11,623 - INFO - Going to convert document batch...
2025-11-14 17:17:11,623 - INFO - Processing document 8-K_2023-02-01
2025-11-14 17:17:11,643 - INFO - Finished converting document 8-K_2023-02-01 in 0.05 sec.
2025-11-14 17:17:11,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,684 - INFO - Going to convert document batch...
2025-11-14 17:17:11,685 - INFO - Processing document 8-K_2023-02-02
2025-11-14 17:17:11,701 - INFO - Finished converting document 8-K_2023-02-02 in 0.05 sec.
2025-11-14 17:17:11,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,736 - INFO - Going to convert document batch...
2025-11-14 17:17:11,736 - INFO - Processing document 8-K_2023-02-13
2025-11-14 17:17:11,754 - INFO - Finished converting document 8-K_2023-02-13 in 0.05 sec.
2025-11-14 17:17:11,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,790 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\META\8-K_2023-02-01' --> 'data\processed_data\META\8-K_2023-02-01.md'
Converted 'data\edgar_documents\META\8-K_2023-02-02' --> 'data\processed_data\META\8-K_2023-02-02.md'
Converted 'data\edgar_documents\META\8-K_2023-02-13' --> 'data\processed_data\META\8-K_2023-02-13.md'
Converted 'data\edgar_documents\META\8-K_2023-02-15' --> 'data\processed_data\META\8-K_2023-02-15.md'


2025-11-14 17:17:11,841 - INFO - Processing document 8-K_2023-03-14
2025-11-14 17:17:11,860 - INFO - Finished converting document 8-K_2023-03-14 in 0.05 sec.
2025-11-14 17:17:11,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:11,903 - INFO - Going to convert document batch...
2025-11-14 17:17:11,904 - INFO - Processing document 8-K_2023-04-10
2025-11-14 17:17:11,922 - INFO - Finished converting document 8-K_2023-04-10 in 0.05 sec.
2025-11-14 17:17:11,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,002 - INFO - Going to convert document batch...
2025-11-14 17:17:12,003 - INFO - Processing document 8-K_2023-04-26
2025-11-14 17:17:12,022 - INFO - Finished converting document 8-K_2023-04-26 in 0.06 sec.
2025-11-14 17:17:12,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,056 - INFO - Going to convert document batch...
2025-11-14 17:17:12,057 - INFO - Processing document 8-K_2023-05-03


Converted 'data\edgar_documents\META\8-K_2023-03-14' --> 'data\processed_data\META\8-K_2023-03-14.md'
Converted 'data\edgar_documents\META\8-K_2023-04-10' --> 'data\processed_data\META\8-K_2023-04-10.md'
Converted 'data\edgar_documents\META\8-K_2023-04-26' --> 'data\processed_data\META\8-K_2023-04-26.md'


2025-11-14 17:17:12,079 - INFO - Finished converting document 8-K_2023-05-03 in 0.05 sec.
2025-11-14 17:17:12,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,137 - INFO - Going to convert document batch...
2025-11-14 17:17:12,138 - INFO - Processing document 8-K_2023-06-02
2025-11-14 17:17:12,184 - INFO - Finished converting document 8-K_2023-06-02 in 0.09 sec.
2025-11-14 17:17:12,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,232 - INFO - Going to convert document batch...
2025-11-14 17:17:12,233 - INFO - Processing document 8-K_2023-07-26
2025-11-14 17:17:12,250 - INFO - Finished converting document 8-K_2023-07-26 in 0.05 sec.
2025-11-14 17:17:12,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\8-K_2023-05-03' --> 'data\processed_data\META\8-K_2023-05-03.md'
Converted 'data\edgar_documents\META\8-K_2023-06-02' --> 'data\processed_data\META\8-K_2023-06-02.md'
Converted 'data\edgar_documents\META\8-K_2023-07-26' --> 'data\processed_data\META\8-K_2023-07-26.md'


2025-11-14 17:17:12,313 - INFO - Going to convert document batch...
2025-11-14 17:17:12,315 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:17:12,334 - INFO - Finished converting document 8-K_2023-10-25 in 0.06 sec.
2025-11-14 17:17:12,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,373 - INFO - Going to convert document batch...
2025-11-14 17:17:12,374 - INFO - Processing document 8-K_2024-01-18
2025-11-14 17:17:12,396 - INFO - Finished converting document 8-K_2024-01-18 in 0.05 sec.
2025-11-14 17:17:12,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,455 - INFO - Going to convert document batch...
2025-11-14 17:17:12,456 - INFO - Processing document 8-K_2024-02-01
2025-11-14 17:17:12,476 - INFO - Finished converting document 8-K_2024-02-01 in 0.05 sec.
2025-11-14 17:17:12,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,510 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\META\8-K_2023-10-25' --> 'data\processed_data\META\8-K_2023-10-25.md'
Converted 'data\edgar_documents\META\8-K_2024-01-18' --> 'data\processed_data\META\8-K_2024-01-18.md'
Converted 'data\edgar_documents\META\8-K_2024-02-01' --> 'data\processed_data\META\8-K_2024-02-01.md'


2025-11-14 17:17:12,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,564 - INFO - Going to convert document batch...
2025-11-14 17:17:12,565 - INFO - Processing document 8-K_2024-04-24
2025-11-14 17:17:12,586 - INFO - Finished converting document 8-K_2024-04-24 in 0.03 sec.
2025-11-14 17:17:12,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,657 - INFO - Going to convert document batch...
2025-11-14 17:17:12,657 - INFO - Processing document 8-K_2024-05-31
2025-11-14 17:17:12,704 - INFO - Finished converting document 8-K_2024-05-31 in 0.11 sec.
2025-11-14 17:17:12,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\8-K_2024-02-14' --> 'data\processed_data\META\8-K_2024-02-14.md'
Converted 'data\edgar_documents\META\8-K_2024-04-24' --> 'data\processed_data\META\8-K_2024-04-24.md'
Converted 'data\edgar_documents\META\8-K_2024-05-31' --> 'data\processed_data\META\8-K_2024-05-31.md'


2025-11-14 17:17:12,748 - INFO - Going to convert document batch...
2025-11-14 17:17:12,749 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:17:12,767 - INFO - Finished converting document 8-K_2024-07-31 in 0.05 sec.
2025-11-14 17:17:12,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,808 - INFO - Going to convert document batch...
2025-11-14 17:17:12,808 - INFO - Processing document 8-K_2024-08-09
2025-11-14 17:17:12,832 - INFO - Finished converting document 8-K_2024-08-09 in 0.05 sec.
2025-11-14 17:17:12,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,892 - INFO - Going to convert document batch...
2025-11-14 17:17:12,893 - INFO - Processing document 8-K_2024-09-10
2025-11-14 17:17:12,916 - INFO - Finished converting document 8-K_2024-09-10 in 0.06 sec.
2025-11-14 17:17:12,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:12,952 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\META\8-K_2024-07-31' --> 'data\processed_data\META\8-K_2024-07-31.md'
Converted 'data\edgar_documents\META\8-K_2024-08-09' --> 'data\processed_data\META\8-K_2024-08-09.md'
Converted 'data\edgar_documents\META\8-K_2024-09-10' --> 'data\processed_data\META\8-K_2024-09-10.md'


2025-11-14 17:17:12,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,006 - INFO - Going to convert document batch...
2025-11-14 17:17:13,007 - INFO - Processing document 8-K_2025-01-06
2025-11-14 17:17:13,027 - INFO - Finished converting document 8-K_2025-01-06 in 0.05 sec.
2025-11-14 17:17:13,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,063 - INFO - Going to convert document batch...
2025-11-14 17:17:13,064 - INFO - Processing document 8-K_2025-01-29
2025-11-14 17:17:13,083 - INFO - Finished converting document 8-K_2025-01-29 in 0.05 sec.
2025-11-14 17:17:13,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,120 - INFO - Going to convert document batch...
2025-11-14 17:17:13,121 - INFO - Processing document 8-K_2025-02-20
2025-11-14 17:17:13,140 - INFO - Finished converting document 8-K_2025-02-20 in 0.05 sec.
2025-11-14 17:17:13,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\META\8-K_2024-10-30' --> 'data\processed_data\META\8-K_2024-10-30.md'
Converted 'data\edgar_documents\META\8-K_2025-01-06' --> 'data\processed_data\META\8-K_2025-01-06.md'
Converted 'data\edgar_documents\META\8-K_2025-01-29' --> 'data\processed_data\META\8-K_2025-01-29.md'
Converted 'data\edgar_documents\META\8-K_2025-02-20' --> 'data\processed_data\META\8-K_2025-02-20.md'


2025-11-14 17:17:13,173 - INFO - Processing document 8-K_2025-04-11
2025-11-14 17:17:13,199 - INFO - Finished converting document 8-K_2025-04-11 in 0.05 sec.
2025-11-14 17:17:13,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,254 - INFO - Going to convert document batch...
2025-11-14 17:17:13,255 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:17:13,281 - INFO - Finished converting document 8-K_2025-04-30 in 0.06 sec.
2025-11-14 17:17:13,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,334 - INFO - Going to convert document batch...
2025-11-14 17:17:13,335 - INFO - Processing document 8-K_2025-05-30
2025-11-14 17:17:13,383 - INFO - Finished converting document 8-K_2025-05-30 in 0.08 sec.


Converted 'data\edgar_documents\META\8-K_2025-04-11' --> 'data\processed_data\META\8-K_2025-04-11.md'
Converted 'data\edgar_documents\META\8-K_2025-04-30' --> 'data\processed_data\META\8-K_2025-04-30.md'
Converted 'data\edgar_documents\META\8-K_2025-05-30' --> 'data\processed_data\META\8-K_2025-05-30.md'


2025-11-14 17:17:13,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,431 - INFO - Going to convert document batch...
2025-11-14 17:17:13,432 - INFO - Processing document 8-K_2025-07-30
2025-11-14 17:17:13,452 - INFO - Finished converting document 8-K_2025-07-30 in 0.05 sec.
2025-11-14 17:17:13,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,491 - INFO - Going to convert document batch...
2025-11-14 17:17:13,491 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:17:13,510 - INFO - Finished converting document 8-K_2025-10-29 in 0.03 sec.
2025-11-14 17:17:13,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:13,546 - INFO - Going to convert document batch...
2025-11-14 17:17:13,547 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:17:13,568 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 17:17:13,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\8-K_2025-07-30' --> 'data\processed_data\META\8-K_2025-07-30.md'
Converted 'data\edgar_documents\META\8-K_2025-10-29' --> 'data\processed_data\META\8-K_2025-10-29.md'
Converted 'data\edgar_documents\META\8-K_2025-11-03' --> 'data\processed_data\META\8-K_2025-11-03.md'


2025-11-14 17:17:14,130 - INFO - Going to convert document batch...
2025-11-14 17:17:14,131 - INFO - Processing document DEF-14A_2023-04-14
2025-11-14 17:17:15,259 - INFO - Finished converting document DEF-14A_2023-04-14 in 1.67 sec.
2025-11-14 17:17:15,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\DEF-14A_2023-04-14' --> 'data\processed_data\META\DEF-14A_2023-04-14.md'


2025-11-14 17:17:16,321 - INFO - Going to convert document batch...
2025-11-14 17:17:16,321 - INFO - Processing document DEF-14A_2024-04-19
2025-11-14 17:17:17,587 - INFO - Finished converting document DEF-14A_2024-04-19 in 1.84 sec.
2025-11-14 17:17:18,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\DEF-14A_2024-04-19' --> 'data\processed_data\META\DEF-14A_2024-04-19.md'


2025-11-14 17:17:18,431 - INFO - Going to convert document batch...
2025-11-14 17:17:18,432 - INFO - Processing document DEF-14A_2025-04-17
2025-11-14 17:17:19,545 - INFO - Finished converting document DEF-14A_2025-04-17 in 1.45 sec.
2025-11-14 17:17:20,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\META\DEF-14A_2025-04-17' --> 'data\processed_data\META\DEF-14A_2025-04-17.md'
Processed 363 new files. Errors: 3
Found 127 files to process in data\edgar_documents\MMM


2025-11-14 17:17:21,957 - INFO - Going to convert document batch...
2025-11-14 17:17:21,958 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:17:21,959 - INFO - Processing document 10-K_2023-02-08
2025-11-14 17:17:23,995 - INFO - Finished converting document 10-K_2023-02-08 in 3.94 sec.
2025-11-14 17:17:25,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\10-K_2023-02-08' --> 'data\processed_data\MMM\10-K_2023-02-08.md'


2025-11-14 17:17:26,280 - INFO - Going to convert document batch...
2025-11-14 17:17:26,281 - INFO - Processing document 10-K_2024-02-07
2025-11-14 17:17:28,006 - INFO - Finished converting document 10-K_2024-02-07 in 3.06 sec.
2025-11-14 17:17:28,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\10-K_2024-02-07' --> 'data\processed_data\MMM\10-K_2024-02-07.md'


2025-11-14 17:17:30,565 - INFO - Going to convert document batch...
2025-11-14 17:17:30,566 - INFO - Processing document 10-K_2025-02-05
2025-11-14 17:17:32,816 - INFO - Finished converting document 10-K_2025-02-05 in 3.94 sec.
2025-11-14 17:17:33,776 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:33,777 - ERROR - Input document 10-Q_2023-04-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17:33,779 - INFO - Going to convert d

Converted 'data\edgar_documents\MMM\10-K_2025-02-05' --> 'data\processed_data\MMM\10-K_2025-02-05.md'
Error processing data\edgar_documents\MMM\10-Q_2023-04-25: File format not allowed: data\edgar_documents\MMM\10-Q_2023-04-25


2025-11-14 17:17:34,489 - INFO - Going to convert document batch...
2025-11-14 17:17:34,490 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 17:17:35,834 - INFO - Finished converting document 10-Q_2023-07-25 in 2.05 sec.
2025-11-14 17:17:36,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\10-Q_2023-07-25' --> 'data\processed_data\MMM\10-Q_2023-07-25.md'


2025-11-14 17:17:37,812 - INFO - Going to convert document batch...
2025-11-14 17:17:37,813 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 17:17:39,132 - INFO - Finished converting document 10-Q_2023-10-24 in 2.58 sec.
2025-11-14 17:17:39,900 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:39,901 - ERROR - Input document 10-Q_2024-04-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17:39,903 - INFO - Going to convert d

Converted 'data\edgar_documents\MMM\10-Q_2023-10-24' --> 'data\processed_data\MMM\10-Q_2023-10-24.md'
Error processing data\edgar_documents\MMM\10-Q_2024-04-30: File format not allowed: data\edgar_documents\MMM\10-Q_2024-04-30


2025-11-14 17:17:40,950 - INFO - Going to convert document batch...
2025-11-14 17:17:40,951 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 17:17:42,190 - INFO - Finished converting document 10-Q_2024-07-26 in 2.28 sec.
2025-11-14 17:17:42,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\10-Q_2024-07-26' --> 'data\processed_data\MMM\10-Q_2024-07-26.md'


2025-11-14 17:17:43,983 - INFO - Going to convert document batch...
2025-11-14 17:17:43,984 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 17:17:45,255 - INFO - Finished converting document 10-Q_2024-10-22 in 2.36 sec.
2025-11-14 17:17:45,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\10-Q_2024-10-22' --> 'data\processed_data\MMM\10-Q_2024-10-22.md'


2025-11-14 17:17:46,900 - INFO - Going to convert document batch...
2025-11-14 17:17:46,901 - INFO - Processing document 10-Q_2025-04-22
2025-11-14 17:17:47,760 - INFO - Finished converting document 10-Q_2025-04-22 in 1.81 sec.
2025-11-14 17:17:48,305 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:48,306 - ERROR - Input document 10-Q_2025-07-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17:48,309 - INFO - Going to convert d

Converted 'data\edgar_documents\MMM\10-Q_2025-04-22' --> 'data\processed_data\MMM\10-Q_2025-04-22.md'
Error processing data\edgar_documents\MMM\10-Q_2025-07-18: File format not allowed: data\edgar_documents\MMM\10-Q_2025-07-18


2025-11-14 17:17:49,382 - INFO - Going to convert document batch...
2025-11-14 17:17:49,383 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 17:17:50,720 - INFO - Finished converting document 10-Q_2025-10-21 in 2.41 sec.
2025-11-14 17:17:51,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,474 - INFO - Going to convert document batch...
2025-11-14 17:17:51,475 - INFO - Processing document 4_2023-01-27
2025-11-14 17:17:51,492 - INFO - Finished converting document 4_2023-01-27 in 0.05 sec.
2025-11-14 17:17:51,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,567 - INFO - Going to convert document batch...
2025-11-14 17:17:51,568 - INFO - Processing document 4_2023-02-06
2025-11-14 17:17:51,587 - INFO - Finished converting document 4_2023-02-06 in 0.06 sec.


Converted 'data\edgar_documents\MMM\10-Q_2025-10-21' --> 'data\processed_data\MMM\10-Q_2025-10-21.md'
Converted 'data\edgar_documents\MMM\4_2023-01-27' --> 'data\processed_data\MMM\4_2023-01-27.md'
Converted 'data\edgar_documents\MMM\4_2023-02-06' --> 'data\processed_data\MMM\4_2023-02-06.md'


2025-11-14 17:17:51,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,645 - INFO - Going to convert document batch...
2025-11-14 17:17:51,646 - INFO - Processing document 4_2023-02-07
2025-11-14 17:17:51,667 - INFO - Finished converting document 4_2023-02-07 in 0.06 sec.
2025-11-14 17:17:51,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,722 - INFO - Going to convert document batch...
2025-11-14 17:17:51,723 - INFO - Processing document 4_2023-02-08
2025-11-14 17:17:51,744 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.
2025-11-14 17:17:51,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,800 - INFO - Going to convert document batch...
2025-11-14 17:17:51,801 - INFO - Processing document 4_2023-02-10
2025-11-14 17:17:51,818 - INFO - Finished converting document 4_2023-02-10 in 0.05 sec.
2025-11-14 17:17:51,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MMM\4_2023-02-07' --> 'data\processed_data\MMM\4_2023-02-07.md'
Converted 'data\edgar_documents\MMM\4_2023-02-08' --> 'data\processed_data\MMM\4_2023-02-08.md'
Converted 'data\edgar_documents\MMM\4_2023-02-10' --> 'data\processed_data\MMM\4_2023-02-10.md'


2025-11-14 17:17:51,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:51,928 - INFO - Going to convert document batch...
2025-11-14 17:17:51,929 - INFO - Processing document 4_2023-02-23
2025-11-14 17:17:51,947 - INFO - Finished converting document 4_2023-02-23 in 0.03 sec.
2025-11-14 17:17:51,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,009 - INFO - Going to convert document batch...
2025-11-14 17:17:52,011 - INFO - Processing document 4_2023-04-28
2025-11-14 17:17:52,049 - INFO - Finished converting document 4_2023-04-28 in 0.08 sec.
2025-11-14 17:17:52,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2023-02-21' --> 'data\processed_data\MMM\4_2023-02-21.md'
Converted 'data\edgar_documents\MMM\4_2023-02-23' --> 'data\processed_data\MMM\4_2023-02-23.md'
Converted 'data\edgar_documents\MMM\4_2023-04-28' --> 'data\processed_data\MMM\4_2023-04-28.md'


2025-11-14 17:17:52,109 - INFO - Going to convert document batch...
2025-11-14 17:17:52,110 - INFO - Processing document 4_2023-05-01
2025-11-14 17:17:52,129 - INFO - Finished converting document 4_2023-05-01 in 0.05 sec.
2025-11-14 17:17:52,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,185 - INFO - Going to convert document batch...
2025-11-14 17:17:52,185 - INFO - Processing document 4_2023-05-02
2025-11-14 17:17:52,205 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 17:17:52,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,248 - INFO - Going to convert document batch...
2025-11-14 17:17:52,249 - INFO - Processing document 4_2023-05-10
2025-11-14 17:17:52,269 - INFO - Finished converting document 4_2023-05-10 in 0.03 sec.
2025-11-14 17:17:52,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,340 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MMM\4_2023-05-01' --> 'data\processed_data\MMM\4_2023-05-01.md'
Converted 'data\edgar_documents\MMM\4_2023-05-02' --> 'data\processed_data\MMM\4_2023-05-02.md'
Converted 'data\edgar_documents\MMM\4_2023-05-10' --> 'data\processed_data\MMM\4_2023-05-10.md'


2025-11-14 17:17:52,341 - INFO - Processing document 4_2023-05-19
2025-11-14 17:17:52,359 - INFO - Finished converting document 4_2023-05-19 in 0.06 sec.
2025-11-14 17:17:52,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,422 - INFO - Going to convert document batch...
2025-11-14 17:17:52,423 - INFO - Processing document 4_2023-07-05
2025-11-14 17:17:52,456 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 17:17:52,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,557 - INFO - Going to convert document batch...
2025-11-14 17:17:52,558 - INFO - Processing document 4_2023-07-28
2025-11-14 17:17:52,582 - INFO - Finished converting document 4_2023-07-28 in 0.08 sec.


Converted 'data\edgar_documents\MMM\4_2023-05-19' --> 'data\processed_data\MMM\4_2023-05-19.md'
Converted 'data\edgar_documents\MMM\4_2023-07-05' --> 'data\processed_data\MMM\4_2023-07-05.md'


2025-11-14 17:17:52,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,635 - INFO - Going to convert document batch...
2025-11-14 17:17:52,636 - INFO - Processing document 4_2023-08-11
2025-11-14 17:17:52,656 - INFO - Finished converting document 4_2023-08-11 in 0.06 sec.
2025-11-14 17:17:52,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,706 - INFO - Going to convert document batch...
2025-11-14 17:17:52,707 - INFO - Processing document 4_2023-09-06
2025-11-14 17:17:52,726 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 17:17:52,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,773 - INFO - Going to convert document batch...
2025-11-14 17:17:52,773 - INFO - Processing document 4_2023-10-05
2025-11-14 17:17:52,794 - INFO - Finished converting document 4_2023-10-05 in 0.05 sec.


Converted 'data\edgar_documents\MMM\4_2023-07-28' --> 'data\processed_data\MMM\4_2023-07-28.md'
Converted 'data\edgar_documents\MMM\4_2023-08-11' --> 'data\processed_data\MMM\4_2023-08-11.md'
Converted 'data\edgar_documents\MMM\4_2023-09-06' --> 'data\processed_data\MMM\4_2023-09-06.md'


2025-11-14 17:17:52,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,849 - INFO - Going to convert document batch...
2025-11-14 17:17:52,850 - INFO - Processing document 4_2023-10-27
2025-11-14 17:17:52,869 - INFO - Finished converting document 4_2023-10-27 in 0.06 sec.
2025-11-14 17:17:52,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,917 - INFO - Going to convert document batch...
2025-11-14 17:17:52,917 - INFO - Processing document 4_2023-11-08
2025-11-14 17:17:52,935 - INFO - Finished converting document 4_2023-11-08 in 0.05 sec.
2025-11-14 17:17:52,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:52,988 - INFO - Going to convert document batch...
2025-11-14 17:17:52,989 - INFO - Processing document 4_2023-12-04


Converted 'data\edgar_documents\MMM\4_2023-10-05' --> 'data\processed_data\MMM\4_2023-10-05.md'
Converted 'data\edgar_documents\MMM\4_2023-10-27' --> 'data\processed_data\MMM\4_2023-10-27.md'
Converted 'data\edgar_documents\MMM\4_2023-11-08' --> 'data\processed_data\MMM\4_2023-11-08.md'


2025-11-14 17:17:53,011 - INFO - Finished converting document 4_2023-12-04 in 0.06 sec.
2025-11-14 17:17:53,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,055 - INFO - Going to convert document batch...
2025-11-14 17:17:53,056 - INFO - Processing document 4_2023-12-26
2025-11-14 17:17:53,074 - INFO - Finished converting document 4_2023-12-26 in 0.05 sec.
2025-11-14 17:17:53,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,120 - INFO - Going to convert document batch...
2025-11-14 17:17:53,121 - INFO - Processing document 4_2024-01-26
2025-11-14 17:17:53,139 - INFO - Finished converting document 4_2024-01-26 in 0.05 sec.
2025-11-14 17:17:53,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,199 - INFO - Going to convert document batch...
2025-11-14 17:17:53,200 - INFO - Processing document 4_2024-02-05
2025-11-14 17:17:53,222 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.


Converted 'data\edgar_documents\MMM\4_2023-12-04' --> 'data\processed_data\MMM\4_2023-12-04.md'
Converted 'data\edgar_documents\MMM\4_2023-12-26' --> 'data\processed_data\MMM\4_2023-12-26.md'
Converted 'data\edgar_documents\MMM\4_2024-01-26' --> 'data\processed_data\MMM\4_2024-01-26.md'


2025-11-14 17:17:53,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,269 - INFO - Going to convert document batch...
2025-11-14 17:17:53,270 - INFO - Processing document 4_2024-02-06
2025-11-14 17:17:53,290 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 17:17:53,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,346 - INFO - Going to convert document batch...
2025-11-14 17:17:53,347 - INFO - Processing document 4_2024-02-15
2025-11-14 17:17:53,379 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.


Converted 'data\edgar_documents\MMM\4_2024-02-05' --> 'data\processed_data\MMM\4_2024-02-05.md'
Converted 'data\edgar_documents\MMM\4_2024-02-06' --> 'data\processed_data\MMM\4_2024-02-06.md'
Converted 'data\edgar_documents\MMM\4_2024-02-15' --> 'data\processed_data\MMM\4_2024-02-15.md'


2025-11-14 17:17:53,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,437 - INFO - Going to convert document batch...
2025-11-14 17:17:53,437 - INFO - Processing document 4_2024-03-26
2025-11-14 17:17:53,455 - INFO - Finished converting document 4_2024-03-26 in 0.05 sec.
2025-11-14 17:17:53,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,512 - INFO - Going to convert document batch...
2025-11-14 17:17:53,512 - INFO - Processing document 4_2024-04-03
2025-11-14 17:17:53,530 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 17:17:53,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,577 - INFO - Going to convert document batch...
2025-11-14 17:17:53,578 - INFO - Processing document 4_2024-05-03
2025-11-14 17:17:53,600 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.
2025-11-14 17:17:53,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2024-03-26' --> 'data\processed_data\MMM\4_2024-03-26.md'
Converted 'data\edgar_documents\MMM\4_2024-04-03' --> 'data\processed_data\MMM\4_2024-04-03.md'
Converted 'data\edgar_documents\MMM\4_2024-05-03' --> 'data\processed_data\MMM\4_2024-05-03.md'


2025-11-14 17:17:53,664 - INFO - Going to convert document batch...
2025-11-14 17:17:53,664 - INFO - Processing document 4_2024-05-06
2025-11-14 17:17:53,684 - INFO - Finished converting document 4_2024-05-06 in 0.06 sec.
2025-11-14 17:17:53,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,755 - INFO - Going to convert document batch...
2025-11-14 17:17:53,757 - INFO - Processing document 4_2024-05-08
2025-11-14 17:17:53,780 - INFO - Finished converting document 4_2024-05-08 in 0.08 sec.
2025-11-14 17:17:53,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,829 - INFO - Going to convert document batch...
2025-11-14 17:17:53,830 - INFO - Processing document 4_2024-05-14
2025-11-14 17:17:53,852 - INFO - Finished converting document 4_2024-05-14 in 0.05 sec.
2025-11-14 17:17:53,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2024-05-06' --> 'data\processed_data\MMM\4_2024-05-06.md'
Converted 'data\edgar_documents\MMM\4_2024-05-08' --> 'data\processed_data\MMM\4_2024-05-08.md'
Converted 'data\edgar_documents\MMM\4_2024-05-14' --> 'data\processed_data\MMM\4_2024-05-14.md'


2025-11-14 17:17:53,901 - INFO - Going to convert document batch...
2025-11-14 17:17:53,902 - INFO - Processing document 4_2024-05-15
2025-11-14 17:17:53,920 - INFO - Finished converting document 4_2024-05-15 in 0.05 sec.
2025-11-14 17:17:53,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:53,972 - INFO - Going to convert document batch...
2025-11-14 17:17:53,972 - INFO - Processing document 4_2024-07-01
2025-11-14 17:17:53,993 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 17:17:54,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,050 - INFO - Going to convert document batch...
2025-11-14 17:17:54,051 - INFO - Processing document 4_2024-07-02
2025-11-14 17:17:54,073 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 17:17:54,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2024-05-15' --> 'data\processed_data\MMM\4_2024-05-15.md'
Converted 'data\edgar_documents\MMM\4_2024-07-01' --> 'data\processed_data\MMM\4_2024-07-01.md'
Converted 'data\edgar_documents\MMM\4_2024-07-02' --> 'data\processed_data\MMM\4_2024-07-02.md'


2025-11-14 17:17:54,133 - INFO - Going to convert document batch...
2025-11-14 17:17:54,134 - INFO - Processing document 4_2024-08-02
2025-11-14 17:17:54,153 - INFO - Finished converting document 4_2024-08-02 in 0.06 sec.
2025-11-14 17:17:54,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,204 - INFO - Going to convert document batch...
2025-11-14 17:17:54,205 - INFO - Processing document 4_2024-08-07
2025-11-14 17:17:54,222 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.
2025-11-14 17:17:54,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,271 - INFO - Going to convert document batch...
2025-11-14 17:17:54,272 - INFO - Processing document 4_2024-08-08
2025-11-14 17:17:54,291 - INFO - Finished converting document 4_2024-08-08 in 0.06 sec.
2025-11-14 17:17:54,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,344 - INFO - Going to convert document batch...
2025-11-14 17:17:54,345 - 

Converted 'data\edgar_documents\MMM\4_2024-08-02' --> 'data\processed_data\MMM\4_2024-08-02.md'
Converted 'data\edgar_documents\MMM\4_2024-08-07' --> 'data\processed_data\MMM\4_2024-08-07.md'
Converted 'data\edgar_documents\MMM\4_2024-08-08' --> 'data\processed_data\MMM\4_2024-08-08.md'


2025-11-14 17:17:54,768 - INFO - Finished converting document 4_2024-10-02 in 0.45 sec.
2025-11-14 17:17:54,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,821 - INFO - Going to convert document batch...
2025-11-14 17:17:54,822 - INFO - Processing document 4_2024-10-17
2025-11-14 17:17:54,856 - INFO - Finished converting document 4_2024-10-17 in 0.08 sec.
2025-11-14 17:17:54,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,920 - INFO - Going to convert document batch...
2025-11-14 17:17:54,921 - INFO - Processing document 4_2024-11-04
2025-11-14 17:17:54,944 - INFO - Finished converting document 4_2024-11-04 in 0.05 sec.


Converted 'data\edgar_documents\MMM\4_2024-10-02' --> 'data\processed_data\MMM\4_2024-10-02.md'
Converted 'data\edgar_documents\MMM\4_2024-10-17' --> 'data\processed_data\MMM\4_2024-10-17.md'


2025-11-14 17:17:54,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:54,998 - INFO - Going to convert document batch...
2025-11-14 17:17:54,999 - INFO - Processing document 4_2024-11-21
2025-11-14 17:17:55,019 - INFO - Finished converting document 4_2024-11-21 in 0.05 sec.
2025-11-14 17:17:55,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,076 - INFO - Going to convert document batch...
2025-11-14 17:17:55,077 - INFO - Processing document 4_2024-12-02
2025-11-14 17:17:55,099 - INFO - Finished converting document 4_2024-12-02 in 0.06 sec.
2025-11-14 17:17:55,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,155 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MMM\4_2024-11-04' --> 'data\processed_data\MMM\4_2024-11-04.md'
Converted 'data\edgar_documents\MMM\4_2024-11-21' --> 'data\processed_data\MMM\4_2024-11-21.md'
Converted 'data\edgar_documents\MMM\4_2024-12-02' --> 'data\processed_data\MMM\4_2024-12-02.md'


2025-11-14 17:17:55,156 - INFO - Processing document 4_2025-01-27
2025-11-14 17:17:55,187 - INFO - Finished converting document 4_2025-01-27 in 0.06 sec.
2025-11-14 17:17:55,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,264 - INFO - Going to convert document batch...
2025-11-14 17:17:55,265 - INFO - Processing document 4_2025-01-28
2025-11-14 17:17:55,285 - INFO - Finished converting document 4_2025-01-28 in 0.05 sec.
2025-11-14 17:17:55,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,356 - INFO - Going to convert document batch...
2025-11-14 17:17:55,357 - INFO - Processing document 4_2025-01-30
2025-11-14 17:17:55,397 - INFO - Finished converting document 4_2025-01-30 in 0.09 sec.


Converted 'data\edgar_documents\MMM\4_2025-01-27' --> 'data\processed_data\MMM\4_2025-01-27.md'
Converted 'data\edgar_documents\MMM\4_2025-01-28' --> 'data\processed_data\MMM\4_2025-01-28.md'
Converted 'data\edgar_documents\MMM\4_2025-01-30' --> 'data\processed_data\MMM\4_2025-01-30.md'


2025-11-14 17:17:55,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,466 - INFO - Going to convert document batch...
2025-11-14 17:17:55,467 - INFO - Processing document 4_2025-02-03
2025-11-14 17:17:55,487 - INFO - Finished converting document 4_2025-02-03 in 0.05 sec.
2025-11-14 17:17:55,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,528 - INFO - Going to convert document batch...
2025-11-14 17:17:55,528 - INFO - Processing document 4_2025-02-05
2025-11-14 17:17:55,549 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:17:55,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,592 - INFO - Going to convert document batch...
2025-11-14 17:17:55,593 - INFO - Processing document 4_2025-02-10
2025-11-14 17:17:55,612 - INFO - Finished converting document 4_2025-02-10 in 0.05 sec.
2025-11-14 17:17:55,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MMM\4_2025-02-03' --> 'data\processed_data\MMM\4_2025-02-03.md'
Converted 'data\edgar_documents\MMM\4_2025-02-05' --> 'data\processed_data\MMM\4_2025-02-05.md'
Converted 'data\edgar_documents\MMM\4_2025-02-10' --> 'data\processed_data\MMM\4_2025-02-10.md'


2025-11-14 17:17:55,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,734 - INFO - Going to convert document batch...
2025-11-14 17:17:55,734 - INFO - Processing document 4_2025-02-18
2025-11-14 17:17:55,756 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 17:17:55,818 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:55,819 - ERROR - Input document 4_2025-03-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17

Converted 'data\edgar_documents\MMM\4_2025-02-13' --> 'data\processed_data\MMM\4_2025-02-13.md'
Converted 'data\edgar_documents\MMM\4_2025-02-18' --> 'data\processed_data\MMM\4_2025-02-18.md'
Error processing data\edgar_documents\MMM\4_2025-03-04: File format not allowed: data\edgar_documents\MMM\4_2025-03-04
Error processing data\edgar_documents\MMM\4_2025-03-05: File format not allowed: data\edgar_documents\MMM\4_2025-03-05


2025-11-14 17:17:55,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:55,973 - INFO - Going to convert document batch...
2025-11-14 17:17:55,974 - INFO - Processing document 4_2025-05-05
2025-11-14 17:17:55,998 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 17:17:56,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,063 - INFO - Going to convert document batch...
2025-11-14 17:17:56,064 - INFO - Processing document 4_2025-05-14
2025-11-14 17:17:56,082 - INFO - Finished converting document 4_2025-05-14 in 0.06 sec.


Converted 'data\edgar_documents\MMM\4_2025-04-28' --> 'data\processed_data\MMM\4_2025-04-28.md'
Converted 'data\edgar_documents\MMM\4_2025-05-05' --> 'data\processed_data\MMM\4_2025-05-05.md'
Converted 'data\edgar_documents\MMM\4_2025-05-14' --> 'data\processed_data\MMM\4_2025-05-14.md'


2025-11-14 17:17:56,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,158 - INFO - Going to convert document batch...
2025-11-14 17:17:56,159 - INFO - Processing document 4_2025-05-19
2025-11-14 17:17:56,193 - INFO - Finished converting document 4_2025-05-19 in 0.08 sec.
2025-11-14 17:17:56,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,257 - INFO - Going to convert document batch...
2025-11-14 17:17:56,258 - INFO - Processing document 4_2025-05-21
2025-11-14 17:17:56,277 - INFO - Finished converting document 4_2025-05-21 in 0.06 sec.
2025-11-14 17:17:56,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,356 - INFO - Going to convert document batch...
2025-11-14 17:17:56,357 - INFO - Processing document 4_2025-05-27
2025-11-14 17:17:56,381 - INFO - Finished converting document 4_2025-05-27 in 0.08 sec.
2025-11-14 17:17:56,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2025-05-19' --> 'data\processed_data\MMM\4_2025-05-19.md'
Converted 'data\edgar_documents\MMM\4_2025-05-21' --> 'data\processed_data\MMM\4_2025-05-21.md'
Converted 'data\edgar_documents\MMM\4_2025-05-27' --> 'data\processed_data\MMM\4_2025-05-27.md'


2025-11-14 17:17:56,440 - INFO - Going to convert document batch...
2025-11-14 17:17:56,441 - INFO - Processing document 4_2025-06-03
2025-11-14 17:17:56,463 - INFO - Finished converting document 4_2025-06-03 in 0.05 sec.
2025-11-14 17:17:56,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,514 - INFO - Going to convert document batch...
2025-11-14 17:17:56,515 - INFO - Processing document 4_2025-07-02
2025-11-14 17:17:56,538 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:17:56,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,579 - INFO - Going to convert document batch...
2025-11-14 17:17:56,580 - INFO - Processing document 4_2025-07-23
2025-11-14 17:17:56,601 - INFO - Finished converting document 4_2025-07-23 in 0.03 sec.
2025-11-14 17:17:56,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,642 - INFO - Going to convert document batch...
2025-11-14 17:17:56,642 - 

Converted 'data\edgar_documents\MMM\4_2025-06-03' --> 'data\processed_data\MMM\4_2025-06-03.md'
Converted 'data\edgar_documents\MMM\4_2025-07-02' --> 'data\processed_data\MMM\4_2025-07-02.md'
Converted 'data\edgar_documents\MMM\4_2025-07-23' --> 'data\processed_data\MMM\4_2025-07-23.md'


2025-11-14 17:17:56,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,702 - INFO - Going to convert document batch...
2025-11-14 17:17:56,703 - INFO - Processing document 4_2025-08-08
2025-11-14 17:17:56,725 - INFO - Finished converting document 4_2025-08-08 in 0.03 sec.
2025-11-14 17:17:56,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,784 - INFO - Going to convert document batch...
2025-11-14 17:17:56,784 - INFO - Processing document 4_2025-08-18
2025-11-14 17:17:56,802 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 17:17:56,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,840 - INFO - Going to convert document batch...
2025-11-14 17:17:56,840 - INFO - Processing document 4_2025-10-02
2025-11-14 17:17:56,862 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.


Converted 'data\edgar_documents\MMM\4_2025-08-06' --> 'data\processed_data\MMM\4_2025-08-06.md'
Converted 'data\edgar_documents\MMM\4_2025-08-08' --> 'data\processed_data\MMM\4_2025-08-08.md'
Converted 'data\edgar_documents\MMM\4_2025-08-18' --> 'data\processed_data\MMM\4_2025-08-18.md'


2025-11-14 17:17:56,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,903 - INFO - Going to convert document batch...
2025-11-14 17:17:56,904 - INFO - Processing document 4_2025-10-27
2025-11-14 17:17:56,925 - INFO - Finished converting document 4_2025-10-27 in 0.05 sec.
2025-11-14 17:17:56,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:56,980 - INFO - Going to convert document batch...
2025-11-14 17:17:56,981 - INFO - Processing document 4_2025-10-30
2025-11-14 17:17:57,020 - INFO - Finished converting document 4_2025-10-30 in 0.08 sec.
2025-11-14 17:17:57,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\4_2025-10-02' --> 'data\processed_data\MMM\4_2025-10-02.md'
Converted 'data\edgar_documents\MMM\4_2025-10-27' --> 'data\processed_data\MMM\4_2025-10-27.md'
Converted 'data\edgar_documents\MMM\4_2025-10-30' --> 'data\processed_data\MMM\4_2025-10-30.md'


2025-11-14 17:17:57,082 - INFO - Going to convert document batch...
2025-11-14 17:17:57,083 - INFO - Processing document 4_2025-11-03
2025-11-14 17:17:57,102 - INFO - Finished converting document 4_2025-11-03 in 0.05 sec.
2025-11-14 17:17:57,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,173 - INFO - Going to convert document batch...
2025-11-14 17:17:57,174 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:17:57,203 - INFO - Finished converting document 8-K_2023-01-24 in 0.08 sec.
2025-11-14 17:17:57,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,244 - INFO - Going to convert document batch...
2025-11-14 17:17:57,245 - INFO - Processing document 8-K_2023-02-08
2025-11-14 17:17:57,263 - INFO - Finished converting document 8-K_2023-02-08 in 0.05 sec.
2025-11-14 17:17:57,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,305 - INFO - Going to convert document batch...
2025-11-14 17:17:5

Converted 'data\edgar_documents\MMM\4_2025-11-03' --> 'data\processed_data\MMM\4_2025-11-03.md'
Converted 'data\edgar_documents\MMM\8-K_2023-01-24' --> 'data\processed_data\MMM\8-K_2023-01-24.md'
Converted 'data\edgar_documents\MMM\8-K_2023-02-08' --> 'data\processed_data\MMM\8-K_2023-02-08.md'


2025-11-14 17:17:57,328 - INFO - Finished converting document 8-K_2023-02-21 in 0.06 sec.
2025-11-14 17:17:57,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,375 - INFO - Going to convert document batch...
2025-11-14 17:17:57,376 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:17:57,394 - INFO - Finished converting document 8-K_2023-04-25 in 0.05 sec.
2025-11-14 17:17:57,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,449 - INFO - Going to convert document batch...
2025-11-14 17:17:57,450 - INFO - Processing document 8-K_2023-05-11
2025-11-14 17:17:57,473 - INFO - Finished converting document 8-K_2023-05-11 in 0.06 sec.
2025-11-14 17:17:57,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,512 - INFO - Going to convert document batch...
2025-11-14 17:17:57,512 - INFO - Processing document 8-K_2023-05-15
2025-11-14 17:17:57,529 - INFO - Finished converting document 8-K_2023-05-15 in 0.

Converted 'data\edgar_documents\MMM\8-K_2023-02-21' --> 'data\processed_data\MMM\8-K_2023-02-21.md'
Converted 'data\edgar_documents\MMM\8-K_2023-04-25' --> 'data\processed_data\MMM\8-K_2023-04-25.md'
Converted 'data\edgar_documents\MMM\8-K_2023-05-11' --> 'data\processed_data\MMM\8-K_2023-05-11.md'


2025-11-14 17:17:57,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,571 - INFO - Going to convert document batch...
2025-11-14 17:17:57,572 - INFO - Processing document 8-K_2023-06-22
2025-11-14 17:17:57,633 - INFO - Finished converting document 8-K_2023-06-22 in 0.09 sec.
2025-11-14 17:17:57,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,706 - INFO - Going to convert document batch...
2025-11-14 17:17:57,706 - INFO - Processing document 8-K_2023-07-10
2025-11-14 17:17:57,724 - INFO - Finished converting document 8-K_2023-07-10 in 0.05 sec.


Converted 'data\edgar_documents\MMM\8-K_2023-05-15' --> 'data\processed_data\MMM\8-K_2023-05-15.md'
Converted 'data\edgar_documents\MMM\8-K_2023-06-22' --> 'data\processed_data\MMM\8-K_2023-06-22.md'


2025-11-14 17:17:57,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,774 - INFO - Going to convert document batch...
2025-11-14 17:17:57,775 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:17:57,792 - INFO - Finished converting document 8-K_2023-07-25 in 0.06 sec.
2025-11-14 17:17:57,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,848 - INFO - Going to convert document batch...
2025-11-14 17:17:57,849 - INFO - Processing document 8-K_2023-08-11
2025-11-14 17:17:57,870 - INFO - Finished converting document 8-K_2023-08-11 in 0.08 sec.
2025-11-14 17:17:57,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,915 - INFO - Going to convert document batch...
2025-11-14 17:17:57,916 - INFO - Processing document 8-K_2023-08-22


Converted 'data\edgar_documents\MMM\8-K_2023-07-10' --> 'data\processed_data\MMM\8-K_2023-07-10.md'
Converted 'data\edgar_documents\MMM\8-K_2023-07-25' --> 'data\processed_data\MMM\8-K_2023-07-25.md'
Converted 'data\edgar_documents\MMM\8-K_2023-08-11' --> 'data\processed_data\MMM\8-K_2023-08-11.md'


2025-11-14 17:17:57,935 - INFO - Finished converting document 8-K_2023-08-22 in 0.06 sec.
2025-11-14 17:17:57,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:57,991 - INFO - Going to convert document batch...
2025-11-14 17:17:57,993 - INFO - Processing document 8-K_2023-08-29
2025-11-14 17:17:58,024 - INFO - Finished converting document 8-K_2023-08-29 in 0.08 sec.
2025-11-14 17:17:58,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,085 - INFO - Going to convert document batch...
2025-11-14 17:17:58,086 - INFO - Processing document 8-K_2023-09-18
2025-11-14 17:17:58,104 - INFO - Finished converting document 8-K_2023-09-18 in 0.06 sec.
2025-11-14 17:17:58,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\8-K_2023-08-22' --> 'data\processed_data\MMM\8-K_2023-08-22.md'
Converted 'data\edgar_documents\MMM\8-K_2023-08-29' --> 'data\processed_data\MMM\8-K_2023-08-29.md'
Converted 'data\edgar_documents\MMM\8-K_2023-09-18' --> 'data\processed_data\MMM\8-K_2023-09-18.md'


2025-11-14 17:17:58,147 - INFO - Going to convert document batch...
2025-11-14 17:17:58,148 - INFO - Processing document 8-K_2023-09-25
2025-11-14 17:17:58,165 - INFO - Finished converting document 8-K_2023-09-25 in 0.05 sec.
2025-11-14 17:17:58,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,205 - INFO - Going to convert document batch...
2025-11-14 17:17:58,206 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:17:58,223 - INFO - Finished converting document 8-K_2023-10-24 in 0.05 sec.
2025-11-14 17:17:58,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,259 - INFO - Going to convert document batch...
2025-11-14 17:17:58,260 - INFO - Processing document 8-K_2023-11-07
2025-11-14 17:17:58,277 - INFO - Finished converting document 8-K_2023-11-07 in 0.05 sec.
2025-11-14 17:17:58,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,310 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MMM\8-K_2023-09-25' --> 'data\processed_data\MMM\8-K_2023-09-25.md'
Converted 'data\edgar_documents\MMM\8-K_2023-10-24' --> 'data\processed_data\MMM\8-K_2023-10-24.md'
Converted 'data\edgar_documents\MMM\8-K_2023-11-07' --> 'data\processed_data\MMM\8-K_2023-11-07.md'
Converted 'data\edgar_documents\MMM\8-K_2023-11-09' --> 'data\processed_data\MMM\8-K_2023-11-09.md'


2025-11-14 17:17:58,362 - INFO - Processing document 8-K_2023-11-21
2025-11-14 17:17:58,380 - INFO - Finished converting document 8-K_2023-11-21 in 0.05 sec.
2025-11-14 17:17:58,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,420 - INFO - Going to convert document batch...
2025-11-14 17:17:58,421 - INFO - Processing document 8-K_2024-01-16
2025-11-14 17:17:58,439 - INFO - Finished converting document 8-K_2024-01-16 in 0.05 sec.
2025-11-14 17:17:58,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,513 - INFO - Going to convert document batch...
2025-11-14 17:17:58,515 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:17:58,532 - INFO - Finished converting document 8-K_2024-01-23 in 0.06 sec.
2025-11-14 17:17:58,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:58,577 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MMM\8-K_2023-11-21' --> 'data\processed_data\MMM\8-K_2023-11-21.md'
Converted 'data\edgar_documents\MMM\8-K_2024-01-16' --> 'data\processed_data\MMM\8-K_2024-01-16.md'
Converted 'data\edgar_documents\MMM\8-K_2024-01-23' --> 'data\processed_data\MMM\8-K_2024-01-23.md'


2025-11-14 17:17:58,577 - INFO - Processing document 8-K_2024-01-29
2025-11-14 17:17:58,598 - INFO - Finished converting document 8-K_2024-01-29 in 0.05 sec.
2025-11-14 17:17:58,627 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:17:58,628 - ERROR - Input document 8-K_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:17:58,629 - INFO - Going to convert document batch...
2025-11-14 17:17:58,642 - INFO - detected formats: [<I

Converted 'data\edgar_documents\MMM\8-K_2024-01-29' --> 'data\processed_data\MMM\8-K_2024-01-29.md'
Error processing data\edgar_documents\MMM\8-K_2024-02-27: File format not allowed: data\edgar_documents\MMM\8-K_2024-02-27
Converted 'data\edgar_documents\MMM\8-K_2024-03-08' --> 'data\processed_data\MMM\8-K_2024-03-08.md'
Converted 'data\edgar_documents\MMM\8-K_2024-03-12' --> 'data\processed_data\MMM\8-K_2024-03-12.md'
Converted 'data\edgar_documents\MMM\8-K_2024-04-04' --> 'data\processed_data\MMM\8-K_2024-04-04.md'


2025-11-14 17:17:58,820 - INFO - Going to convert document batch...
2025-11-14 17:17:58,820 - INFO - Processing document 8-K_2024-04-30
2025-11-14 17:17:58,836 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.
2025-11-14 17:17:58,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\8-K_2024-04-30' --> 'data\processed_data\MMM\8-K_2024-04-30.md'


2025-11-14 17:17:59,118 - INFO - Going to convert document batch...
2025-11-14 17:17:59,119 - INFO - Processing document 8-K_2024-05-16
2025-11-14 17:17:59,145 - INFO - Finished converting document 8-K_2024-05-16 in 0.30 sec.
2025-11-14 17:17:59,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,206 - INFO - Going to convert document batch...
2025-11-14 17:17:59,208 - INFO - Processing document 8-K_2024-06-13
2025-11-14 17:17:59,233 - INFO - Finished converting document 8-K_2024-06-13 in 0.06 sec.
2025-11-14 17:17:59,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,295 - INFO - Going to convert document batch...
2025-11-14 17:17:59,296 - INFO - Processing document 8-K_2024-07-10
2025-11-14 17:17:59,315 - INFO - Finished converting document 8-K_2024-07-10 in 0.08 sec.
2025-11-14 17:17:59,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\8-K_2024-05-16' --> 'data\processed_data\MMM\8-K_2024-05-16.md'
Converted 'data\edgar_documents\MMM\8-K_2024-06-13' --> 'data\processed_data\MMM\8-K_2024-06-13.md'
Converted 'data\edgar_documents\MMM\8-K_2024-07-10' --> 'data\processed_data\MMM\8-K_2024-07-10.md'


2025-11-14 17:17:59,364 - INFO - Going to convert document batch...
2025-11-14 17:17:59,365 - INFO - Processing document 8-K_2024-07-26
2025-11-14 17:17:59,381 - INFO - Finished converting document 8-K_2024-07-26 in 0.05 sec.
2025-11-14 17:17:59,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,431 - INFO - Going to convert document batch...
2025-11-14 17:17:59,432 - INFO - Processing document 8-K_2024-08-01
2025-11-14 17:17:59,452 - INFO - Finished converting document 8-K_2024-08-01 in 0.06 sec.
2025-11-14 17:17:59,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,504 - INFO - Going to convert document batch...
2025-11-14 17:17:59,505 - INFO - Processing document 8-K_2024-08-20
2025-11-14 17:17:59,519 - INFO - Finished converting document 8-K_2024-08-20 in 0.05 sec.
2025-11-14 17:17:59,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,571 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MMM\8-K_2024-07-26' --> 'data\processed_data\MMM\8-K_2024-07-26.md'
Converted 'data\edgar_documents\MMM\8-K_2024-08-01' --> 'data\processed_data\MMM\8-K_2024-08-01.md'
Converted 'data\edgar_documents\MMM\8-K_2024-08-20' --> 'data\processed_data\MMM\8-K_2024-08-20.md'


2025-11-14 17:17:59,588 - INFO - Finished converting document 8-K_2024-10-22 in 0.03 sec.
2025-11-14 17:17:59,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,639 - INFO - Going to convert document batch...
2025-11-14 17:17:59,640 - INFO - Processing document 8-K_2025-01-21
2025-11-14 17:17:59,657 - INFO - Finished converting document 8-K_2025-01-21 in 0.06 sec.
2025-11-14 17:17:59,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,739 - INFO - Going to convert document batch...
2025-11-14 17:17:59,740 - INFO - Processing document 8-K_2025-02-10
2025-11-14 17:17:59,757 - INFO - Finished converting document 8-K_2025-02-10 in 0.08 sec.


Converted 'data\edgar_documents\MMM\8-K_2024-10-22' --> 'data\processed_data\MMM\8-K_2024-10-22.md'
Converted 'data\edgar_documents\MMM\8-K_2025-01-21' --> 'data\processed_data\MMM\8-K_2025-01-21.md'
Converted 'data\edgar_documents\MMM\8-K_2025-02-10' --> 'data\processed_data\MMM\8-K_2025-02-10.md'


2025-11-14 17:17:59,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,831 - INFO - Going to convert document batch...
2025-11-14 17:17:59,832 - INFO - Processing document 8-K_2025-02-21
2025-11-14 17:17:59,848 - INFO - Finished converting document 8-K_2025-02-21 in 0.08 sec.
2025-11-14 17:17:59,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,883 - INFO - Going to convert document batch...
2025-11-14 17:17:59,884 - INFO - Processing document 8-K_2025-02-26
2025-11-14 17:17:59,911 - INFO - Finished converting document 8-K_2025-02-26 in 0.05 sec.
2025-11-14 17:17:59,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:17:59,952 - INFO - Going to convert document batch...
2025-11-14 17:17:59,953 - INFO - Processing document 8-K_2025-03-13
2025-11-14 17:17:59,989 - INFO - Finished converting document 8-K_2025-03-13 in 0.06 sec.


Converted 'data\edgar_documents\MMM\8-K_2025-02-21' --> 'data\processed_data\MMM\8-K_2025-02-21.md'
Converted 'data\edgar_documents\MMM\8-K_2025-02-26' --> 'data\processed_data\MMM\8-K_2025-02-26.md'
Converted 'data\edgar_documents\MMM\8-K_2025-03-13' --> 'data\processed_data\MMM\8-K_2025-03-13.md'


2025-11-14 17:18:00,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:00,070 - INFO - Going to convert document batch...
2025-11-14 17:18:00,070 - INFO - Processing document 8-K_2025-04-22
2025-11-14 17:18:00,088 - INFO - Finished converting document 8-K_2025-04-22 in 0.05 sec.
2025-11-14 17:18:00,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:00,141 - INFO - Going to convert document batch...
2025-11-14 17:18:00,142 - INFO - Processing document 8-K_2025-05-12
2025-11-14 17:18:00,161 - INFO - Finished converting document 8-K_2025-05-12 in 0.06 sec.
2025-11-14 17:18:00,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:00,204 - INFO - Going to convert document batch...
2025-11-14 17:18:00,205 - INFO - Processing document 8-K_2025-05-14
2025-11-14 17:18:00,229 - INFO - Finished converting document 8-K_2025-05-14 in 0.06 sec.
2025-11-14 17:18:00,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\MMM\8-K_2025-04-22' --> 'data\processed_data\MMM\8-K_2025-04-22.md'
Converted 'data\edgar_documents\MMM\8-K_2025-05-12' --> 'data\processed_data\MMM\8-K_2025-05-12.md'
Converted 'data\edgar_documents\MMM\8-K_2025-05-14' --> 'data\processed_data\MMM\8-K_2025-05-14.md'


2025-11-14 17:18:00,283 - INFO - Processing document 8-K_2025-07-18
2025-11-14 17:18:00,301 - INFO - Finished converting document 8-K_2025-07-18 in 0.06 sec.
2025-11-14 17:18:00,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:00,360 - INFO - Going to convert document batch...
2025-11-14 17:18:00,362 - INFO - Processing document 8-K_2025-08-15
2025-11-14 17:18:00,380 - INFO - Finished converting document 8-K_2025-08-15 in 0.06 sec.
2025-11-14 17:18:00,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:00,421 - INFO - Going to convert document batch...
2025-11-14 17:18:00,421 - INFO - Processing document 8-K_2025-10-21
2025-11-14 17:18:00,439 - INFO - Finished converting document 8-K_2025-10-21 in 0.05 sec.
2025-11-14 17:18:00,501 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\MMM\8-K_2025-07-18' --> 'data\processed_data\MMM\8-K_2025-07-18.md'
Converted 'data\edgar_documents\MMM\8-K_2025-08-15' --> 'data\processed_data\MMM\8-K_2025-08-15.md'
Converted 'data\edgar_documents\MMM\8-K_2025-10-21' --> 'data\processed_data\MMM\8-K_2025-10-21.md'


2025-11-14 17:18:00,501 - ERROR - Input document DEF-14A_2023-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:18:00,504 - INFO - Going to convert document batch...
2025-11-14 17:18:00,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\MMM\DEF-14A_2023-03-22: File format not allowed: data\edgar_documents\MMM\DEF-14A_2023-03-22


2025-11-14 17:18:01,457 - INFO - Going to convert document batch...
2025-11-14 17:18:01,458 - INFO - Processing document DEF-14A_2024-03-27
2025-11-14 17:18:06,660 - INFO - Finished converting document DEF-14A_2024-03-27 in 6.16 sec.
2025-11-14 17:18:08,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\DEF-14A_2024-03-27' --> 'data\processed_data\MMM\DEF-14A_2024-03-27.md'


2025-11-14 17:18:08,978 - INFO - Going to convert document batch...
2025-11-14 17:18:08,979 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 17:18:13,253 - INFO - Finished converting document DEF-14A_2025-03-26 in 5.20 sec.
2025-11-14 17:18:14,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MMM\DEF-14A_2025-03-26' --> 'data\processed_data\MMM\DEF-14A_2025-03-26.md'
Processed 120 new files. Errors: 7
Found 88 files to process in data\edgar_documents\MO


2025-11-14 17:18:15,665 - INFO - Going to convert document batch...
2025-11-14 17:18:15,665 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:18:15,667 - INFO - Processing document 10-K_2023-02-27
2025-11-14 17:18:17,155 - INFO - Finished converting document 10-K_2023-02-27 in 2.69 sec.
2025-11-14 17:18:17,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:17,767 - INFO - Going to convert document batch...
2025-11-14 17:18:17,768 - INFO - Processing document 10-K_2023-06-01
2025-11-14 17:18:17,789 - INFO - Finished converting document 10-K_2023-06-01 in 0.05 sec.
2025-11-14 17:18:17,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-K_2023-02-27' --> 'data\processed_data\MO\10-K_2023-02-27.md'
Converted 'data\edgar_documents\MO\10-K_2023-06-01' --> 'data\processed_data\MO\10-K_2023-06-01.md'


2025-11-14 17:18:18,748 - INFO - Going to convert document batch...
2025-11-14 17:18:18,748 - INFO - Processing document 10-K_2024-02-27
2025-11-14 17:18:20,396 - INFO - Finished converting document 10-K_2024-02-27 in 2.58 sec.
2025-11-14 17:18:20,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:20,997 - INFO - Going to convert document batch...
2025-11-14 17:18:20,998 - INFO - Processing document 10-K_2024-06-05
2025-11-14 17:18:21,021 - INFO - Finished converting document 10-K_2024-06-05 in 0.05 sec.
2025-11-14 17:18:21,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-K_2024-02-27' --> 'data\processed_data\MO\10-K_2024-02-27.md'
Converted 'data\edgar_documents\MO\10-K_2024-06-05' --> 'data\processed_data\MO\10-K_2024-06-05.md'


2025-11-14 17:18:21,813 - INFO - Going to convert document batch...
2025-11-14 17:18:21,814 - INFO - Processing document 10-K_2025-02-26
2025-11-14 17:18:23,663 - INFO - Finished converting document 10-K_2025-02-26 in 2.62 sec.
2025-11-14 17:18:24,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:24,278 - INFO - Going to convert document batch...
2025-11-14 17:18:24,279 - INFO - Processing document 10-K_2025-06-04
2025-11-14 17:18:24,301 - INFO - Finished converting document 10-K_2025-06-04 in 0.05 sec.
2025-11-14 17:18:24,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-K_2025-02-26' --> 'data\processed_data\MO\10-K_2025-02-26.md'
Converted 'data\edgar_documents\MO\10-K_2025-06-04' --> 'data\processed_data\MO\10-K_2025-06-04.md'


2025-11-14 17:18:24,698 - INFO - Going to convert document batch...
2025-11-14 17:18:24,699 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:18:25,339 - INFO - Finished converting document 10-Q_2023-04-27 in 1.03 sec.
2025-11-14 17:18:25,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2023-04-27' --> 'data\processed_data\MO\10-Q_2023-04-27.md'


2025-11-14 17:18:26,434 - INFO - Going to convert document batch...
2025-11-14 17:18:26,435 - INFO - Processing document 10-Q_2023-08-01
2025-11-14 17:18:27,320 - INFO - Finished converting document 10-Q_2023-08-01 in 1.69 sec.
2025-11-14 17:18:27,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2023-08-01' --> 'data\processed_data\MO\10-Q_2023-08-01.md'


2025-11-14 17:18:28,590 - INFO - Going to convert document batch...
2025-11-14 17:18:28,591 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:18:29,463 - INFO - Finished converting document 10-Q_2023-10-26 in 1.72 sec.
2025-11-14 17:18:29,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2023-10-26' --> 'data\processed_data\MO\10-Q_2023-10-26.md'


2025-11-14 17:18:30,280 - INFO - Going to convert document batch...
2025-11-14 17:18:30,281 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 17:18:30,942 - INFO - Finished converting document 10-Q_2024-04-25 in 1.03 sec.
2025-11-14 17:18:31,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2024-04-25' --> 'data\processed_data\MO\10-Q_2024-04-25.md'


2025-11-14 17:18:32,168 - INFO - Going to convert document batch...
2025-11-14 17:18:32,170 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 17:18:33,066 - INFO - Finished converting document 10-Q_2024-07-31 in 1.80 sec.
2025-11-14 17:18:33,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2024-07-31' --> 'data\processed_data\MO\10-Q_2024-07-31.md'


2025-11-14 17:18:34,310 - INFO - Going to convert document batch...
2025-11-14 17:18:34,311 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 17:18:35,234 - INFO - Finished converting document 10-Q_2024-10-31 in 1.75 sec.
2025-11-14 17:18:35,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2024-10-31' --> 'data\processed_data\MO\10-Q_2024-10-31.md'


2025-11-14 17:18:36,067 - INFO - Going to convert document batch...
2025-11-14 17:18:36,068 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:18:36,776 - INFO - Finished converting document 10-Q_2025-04-29 in 1.11 sec.
2025-11-14 17:18:37,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2025-04-29' --> 'data\processed_data\MO\10-Q_2025-04-29.md'


2025-11-14 17:18:37,987 - INFO - Going to convert document batch...
2025-11-14 17:18:37,988 - INFO - Processing document 10-Q_2025-07-30
2025-11-14 17:18:38,904 - INFO - Finished converting document 10-Q_2025-07-30 in 1.80 sec.
2025-11-14 17:18:39,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\10-Q_2025-07-30' --> 'data\processed_data\MO\10-Q_2025-07-30.md'


2025-11-14 17:18:40,195 - INFO - Going to convert document batch...
2025-11-14 17:18:40,195 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 17:18:41,119 - INFO - Finished converting document 10-Q_2025-10-30 in 1.75 sec.
2025-11-14 17:18:41,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,603 - INFO - Going to convert document batch...
2025-11-14 17:18:41,604 - INFO - Processing document 4_2023-01-04
2025-11-14 17:18:41,623 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 17:18:41,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,667 - INFO - Going to convert document batch...
2025-11-14 17:18:41,668 - INFO - Processing document 4_2023-02-13
2025-11-14 17:18:41,688 - INFO - Finished converting document 4_2023-02-13 in 0.05 sec.
2025-11-14 17:18:41,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,731 - INFO - Going to convert document batch...
2025-11-14 17:18:41,

Converted 'data\edgar_documents\MO\10-Q_2025-10-30' --> 'data\processed_data\MO\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\MO\4_2023-01-04' --> 'data\processed_data\MO\4_2023-01-04.md'
Converted 'data\edgar_documents\MO\4_2023-02-13' --> 'data\processed_data\MO\4_2023-02-13.md'


2025-11-14 17:18:41,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,800 - INFO - Going to convert document batch...
2025-11-14 17:18:41,801 - INFO - Processing document 4_2023-03-01
2025-11-14 17:18:41,822 - INFO - Finished converting document 4_2023-03-01 in 0.03 sec.
2025-11-14 17:18:41,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,864 - INFO - Going to convert document batch...
2025-11-14 17:18:41,866 - INFO - Processing document 4_2023-03-02
2025-11-14 17:18:41,893 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 17:18:41,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:41,950 - INFO - Going to convert document batch...
2025-11-14 17:18:41,951 - INFO - Processing document 4_2023-04-04
2025-11-14 17:18:41,973 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.


Converted 'data\edgar_documents\MO\4_2023-02-17' --> 'data\processed_data\MO\4_2023-02-17.md'
Converted 'data\edgar_documents\MO\4_2023-03-01' --> 'data\processed_data\MO\4_2023-03-01.md'
Converted 'data\edgar_documents\MO\4_2023-03-02' --> 'data\processed_data\MO\4_2023-03-02.md'


2025-11-14 17:18:42,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,034 - INFO - Going to convert document batch...
2025-11-14 17:18:42,035 - INFO - Processing document 4_2023-05-17
2025-11-14 17:18:42,063 - INFO - Finished converting document 4_2023-05-17 in 0.06 sec.
2025-11-14 17:18:42,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,123 - INFO - Going to convert document batch...
2025-11-14 17:18:42,125 - INFO - Processing document 4_2023-05-22
2025-11-14 17:18:42,158 - INFO - Finished converting document 4_2023-05-22 in 0.06 sec.
2025-11-14 17:18:42,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\4_2023-04-04' --> 'data\processed_data\MO\4_2023-04-04.md'
Converted 'data\edgar_documents\MO\4_2023-05-17' --> 'data\processed_data\MO\4_2023-05-17.md'
Converted 'data\edgar_documents\MO\4_2023-05-22' --> 'data\processed_data\MO\4_2023-05-22.md'


2025-11-14 17:18:42,210 - INFO - Going to convert document batch...
2025-11-14 17:18:42,210 - INFO - Processing document 4_2023-06-05
2025-11-14 17:18:42,236 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 17:18:42,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,291 - INFO - Going to convert document batch...
2025-11-14 17:18:42,292 - INFO - Processing document 4_2023-07-05
2025-11-14 17:18:42,313 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 17:18:42,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,360 - INFO - Going to convert document batch...
2025-11-14 17:18:42,361 - INFO - Processing document 4_2023-10-03
2025-11-14 17:18:42,382 - INFO - Finished converting document 4_2023-10-03 in 0.03 sec.
2025-11-14 17:18:42,425 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:18:42,426 - ERROR - Input document 4_2023-10-30 with format None does 

Converted 'data\edgar_documents\MO\4_2023-06-05' --> 'data\processed_data\MO\4_2023-06-05.md'
Converted 'data\edgar_documents\MO\4_2023-07-05' --> 'data\processed_data\MO\4_2023-07-05.md'
Converted 'data\edgar_documents\MO\4_2023-10-03' --> 'data\processed_data\MO\4_2023-10-03.md'
Error processing data\edgar_documents\MO\4_2023-10-30: File format not allowed: data\edgar_documents\MO\4_2023-10-30


2025-11-14 17:18:42,449 - ERROR - Input document 4_2023-10-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:18:42,450 - INFO - Going to convert document batch...
2025-11-14 17:18:42,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,472 - INFO - Going to convert document batch...
2025-11-14 17:18:42,473 - INFO - Processing document 4_2023-11-01
2025-11-14 17:18:42,492 - INFO - Finished converting document 4_2023-11-01 in 0.03 sec.
2025-11-14 17:18:42,546 - INFO - detec

Error processing data\edgar_documents\MO\4_2023-10-31: File format not allowed: data\edgar_documents\MO\4_2023-10-31
Converted 'data\edgar_documents\MO\4_2023-11-01' --> 'data\processed_data\MO\4_2023-11-01.md'
Converted 'data\edgar_documents\MO\4_2023-11-08' --> 'data\processed_data\MO\4_2023-11-08.md'


2025-11-14 17:18:42,637 - INFO - Processing document 4_2023-11-14
2025-11-14 17:18:42,672 - INFO - Finished converting document 4_2023-11-14 in 0.08 sec.
2025-11-14 17:18:42,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,722 - INFO - Going to convert document batch...
2025-11-14 17:18:42,724 - INFO - Processing document 4_2024-01-03
2025-11-14 17:18:42,754 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 17:18:42,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,799 - INFO - Going to convert document batch...
2025-11-14 17:18:42,799 - INFO - Processing document 4_2024-02-20
2025-11-14 17:18:42,819 - INFO - Finished converting document 4_2024-02-20 in 0.03 sec.
2025-11-14 17:18:42,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,861 - INFO - Going to convert document batch...
2025-11-14 17:18:42,862 - INFO - Processing document 4_2024-02-29
2025-11-14 17:18:42,881 - IN

Converted 'data\edgar_documents\MO\4_2023-11-14' --> 'data\processed_data\MO\4_2023-11-14.md'
Converted 'data\edgar_documents\MO\4_2024-01-03' --> 'data\processed_data\MO\4_2024-01-03.md'
Converted 'data\edgar_documents\MO\4_2024-02-20' --> 'data\processed_data\MO\4_2024-02-20.md'
Converted 'data\edgar_documents\MO\4_2024-02-29' --> 'data\processed_data\MO\4_2024-02-29.md'


2025-11-14 17:18:42,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:42,937 - INFO - Going to convert document batch...
2025-11-14 17:18:42,938 - INFO - Processing document 4_2024-03-01
2025-11-14 17:18:42,961 - INFO - Finished converting document 4_2024-03-01 in 0.05 sec.
2025-11-14 17:18:42,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,006 - INFO - Going to convert document batch...
2025-11-14 17:18:43,006 - INFO - Processing document 4_2024-04-02
2025-11-14 17:18:43,029 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 17:18:43,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,090 - INFO - Going to convert document batch...
2025-11-14 17:18:43,090 - INFO - Processing document 4_2024-04-03
2025-11-14 17:18:43,108 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 17:18:43,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MO\4_2024-03-01' --> 'data\processed_data\MO\4_2024-03-01.md'
Converted 'data\edgar_documents\MO\4_2024-04-02' --> 'data\processed_data\MO\4_2024-04-02.md'
Converted 'data\edgar_documents\MO\4_2024-04-03' --> 'data\processed_data\MO\4_2024-04-03.md'


2025-11-14 17:18:43,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,206 - INFO - Going to convert document batch...
2025-11-14 17:18:43,207 - INFO - Processing document 4_2024-05-20
2025-11-14 17:18:43,228 - INFO - Finished converting document 4_2024-05-20 in 0.03 sec.
2025-11-14 17:18:43,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,275 - INFO - Going to convert document batch...
2025-11-14 17:18:43,277 - INFO - Processing document 4_2024-07-02
2025-11-14 17:18:43,319 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.


Converted 'data\edgar_documents\MO\4_2024-05-06' --> 'data\processed_data\MO\4_2024-05-06.md'
Converted 'data\edgar_documents\MO\4_2024-05-20' --> 'data\processed_data\MO\4_2024-05-20.md'
Converted 'data\edgar_documents\MO\4_2024-07-02' --> 'data\processed_data\MO\4_2024-07-02.md'


2025-11-14 17:18:43,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,389 - INFO - Going to convert document batch...
2025-11-14 17:18:43,390 - INFO - Processing document 4_2024-10-02
2025-11-14 17:18:43,410 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 17:18:43,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,455 - INFO - Going to convert document batch...
2025-11-14 17:18:43,455 - INFO - Processing document 4_2024-12-12
2025-11-14 17:18:43,474 - INFO - Finished converting document 4_2024-12-12 in 0.03 sec.
2025-11-14 17:18:43,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,514 - INFO - Going to convert document batch...
2025-11-14 17:18:43,515 - INFO - Processing document 4_2025-01-03
2025-11-14 17:18:43,536 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:18:43,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MO\4_2024-10-02' --> 'data\processed_data\MO\4_2024-10-02.md'
Converted 'data\edgar_documents\MO\4_2024-12-12' --> 'data\processed_data\MO\4_2024-12-12.md'
Converted 'data\edgar_documents\MO\4_2025-01-03' --> 'data\processed_data\MO\4_2025-01-03.md'
Converted 'data\edgar_documents\MO\4_2025-01-30' --> 'data\processed_data\MO\4_2025-01-30.md'


2025-11-14 17:18:43,669 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:18:43,670 - ERROR - Input document 4_2025-02-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:18:43,672 - INFO - Going to convert document batch...
2025-11-14 17:18:43,694 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:18:43,695 - ERROR - Input document 4_2025-02-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\MO\4_2025-02-04: File format not allowed: data\edgar_documents\MO\4_2025-02-04
Error processing data\edgar_documents\MO\4_2025-02-05: File format not allowed: data\edgar_documents\MO\4_2025-02-05
Converted 'data\edgar_documents\MO\4_2025-02-19' --> 'data\processed_data\MO\4_2025-02-19.md'
Converted 'data\edgar_documents\MO\4_2025-02-28' --> 'data\processed_data\MO\4_2025-02-28.md'


2025-11-14 17:18:43,858 - INFO - Processing document 4_2025-03-03
2025-11-14 17:18:43,877 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.
2025-11-14 17:18:43,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,921 - INFO - Going to convert document batch...
2025-11-14 17:18:43,922 - INFO - Processing document 4_2025-04-18
2025-11-14 17:18:43,942 - INFO - Finished converting document 4_2025-04-18 in 0.05 sec.
2025-11-14 17:18:43,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:43,984 - INFO - Going to convert document batch...
2025-11-14 17:18:43,985 - INFO - Processing document 4_2025-05-19
2025-11-14 17:18:44,004 - INFO - Finished converting document 4_2025-05-19 in 0.03 sec.
2025-11-14 17:18:44,045 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:18:44,045 - ERROR - Input document 4_2025-08-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\MO\4_2025-03-03' --> 'data\processed_data\MO\4_2025-03-03.md'
Converted 'data\edgar_documents\MO\4_2025-04-18' --> 'data\processed_data\MO\4_2025-04-18.md'
Converted 'data\edgar_documents\MO\4_2025-05-19' --> 'data\processed_data\MO\4_2025-05-19.md'
Error processing data\edgar_documents\MO\4_2025-08-04: File format not allowed: data\edgar_documents\MO\4_2025-08-04
Error processing data\edgar_documents\MO\4_2025-08-05: File format not allowed: data\edgar_documents\MO\4_2025-08-05


2025-11-14 17:18:44,087 - INFO - Going to convert document batch...
2025-11-14 17:18:44,088 - INFO - Processing document 4_2025-08-25
2025-11-14 17:18:44,108 - INFO - Finished converting document 4_2025-08-25 in 0.05 sec.
2025-11-14 17:18:44,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,162 - INFO - Going to convert document batch...
2025-11-14 17:18:44,163 - INFO - Processing document 8-K_2023-02-01
2025-11-14 17:18:44,184 - INFO - Finished converting document 8-K_2023-02-01 in 0.06 sec.
2025-11-14 17:18:44,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,227 - INFO - Going to convert document batch...
2025-11-14 17:18:44,228 - INFO - Processing document 8-K_2023-03-06
2025-11-14 17:18:44,250 - INFO - Finished converting document 8-K_2023-03-06 in 0.06 sec.
2025-11-14 17:18:44,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,286 - INFO - Going to convert document batch...
2025-11-14 17:18:4

Converted 'data\edgar_documents\MO\4_2025-08-25' --> 'data\processed_data\MO\4_2025-08-25.md'
Converted 'data\edgar_documents\MO\8-K_2023-02-01' --> 'data\processed_data\MO\8-K_2023-02-01.md'
Converted 'data\edgar_documents\MO\8-K_2023-03-06' --> 'data\processed_data\MO\8-K_2023-03-06.md'


2025-11-14 17:18:44,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,342 - INFO - Going to convert document batch...
2025-11-14 17:18:44,343 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:18:44,362 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 17:18:44,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,405 - INFO - Going to convert document batch...
2025-11-14 17:18:44,405 - INFO - Processing document 8-K_2023-05-10
2025-11-14 17:18:44,423 - INFO - Finished converting document 8-K_2023-05-10 in 0.05 sec.
2025-11-14 17:18:44,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,468 - INFO - Going to convert document batch...
2025-11-14 17:18:44,469 - INFO - Processing document 8-K_2023-05-22
2025-11-14 17:18:44,507 - INFO - Finished converting document 8-K_2023-05-22 in 0.06 sec.


Converted 'data\edgar_documents\MO\8-K_2023-03-23' --> 'data\processed_data\MO\8-K_2023-03-23.md'
Converted 'data\edgar_documents\MO\8-K_2023-04-27' --> 'data\processed_data\MO\8-K_2023-04-27.md'
Converted 'data\edgar_documents\MO\8-K_2023-05-10' --> 'data\processed_data\MO\8-K_2023-05-10.md'


2025-11-14 17:18:44,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,555 - INFO - Going to convert document batch...
2025-11-14 17:18:44,556 - INFO - Processing document 8-K_2023-06-01
2025-11-14 17:18:44,579 - INFO - Finished converting document 8-K_2023-06-01 in 0.05 sec.
2025-11-14 17:18:44,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,622 - INFO - Going to convert document batch...
2025-11-14 17:18:44,623 - INFO - Processing document 8-K_2023-08-01
2025-11-14 17:18:44,644 - INFO - Finished converting document 8-K_2023-08-01 in 0.05 sec.
2025-11-14 17:18:44,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,704 - INFO - Going to convert document batch...
2025-11-14 17:18:44,704 - INFO - Processing document 8-K_2023-08-24


Converted 'data\edgar_documents\MO\8-K_2023-05-22' --> 'data\processed_data\MO\8-K_2023-05-22.md'
Converted 'data\edgar_documents\MO\8-K_2023-06-01' --> 'data\processed_data\MO\8-K_2023-06-01.md'
Converted 'data\edgar_documents\MO\8-K_2023-08-01' --> 'data\processed_data\MO\8-K_2023-08-01.md'


2025-11-14 17:18:44,719 - INFO - Finished converting document 8-K_2023-08-24 in 0.06 sec.
2025-11-14 17:18:44,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,754 - INFO - Going to convert document batch...
2025-11-14 17:18:44,755 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:18:44,780 - INFO - Finished converting document 8-K_2023-10-25 in 0.06 sec.
2025-11-14 17:18:44,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,819 - INFO - Going to convert document batch...
2025-11-14 17:18:44,819 - INFO - Processing document 8-K_2023-10-26
2025-11-14 17:18:44,837 - INFO - Finished converting document 8-K_2023-10-26 in 0.03 sec.
2025-11-14 17:18:44,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,871 - INFO - Going to convert document batch...
2025-11-14 17:18:44,872 - INFO - Processing document 8-K_2023-11-01
2025-11-14 17:18:44,893 - INFO - Finished converting document 8-K_2023-11-01 in 0.

Converted 'data\edgar_documents\MO\8-K_2023-08-24' --> 'data\processed_data\MO\8-K_2023-08-24.md'
Converted 'data\edgar_documents\MO\8-K_2023-10-25' --> 'data\processed_data\MO\8-K_2023-10-25.md'
Converted 'data\edgar_documents\MO\8-K_2023-10-26' --> 'data\processed_data\MO\8-K_2023-10-26.md'
Converted 'data\edgar_documents\MO\8-K_2023-11-01' --> 'data\processed_data\MO\8-K_2023-11-01.md'


2025-11-14 17:18:44,932 - INFO - Going to convert document batch...
2025-11-14 17:18:44,933 - INFO - Processing document 8-K_2024-02-01
2025-11-14 17:18:44,952 - INFO - Finished converting document 8-K_2024-02-01 in 0.05 sec.
2025-11-14 17:18:44,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:44,991 - INFO - Going to convert document batch...
2025-11-14 17:18:44,991 - INFO - Processing document 8-K_2024-02-26
2025-11-14 17:18:45,010 - INFO - Finished converting document 8-K_2024-02-26 in 0.03 sec.
2025-11-14 17:18:45,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,040 - INFO - Going to convert document batch...
2025-11-14 17:18:45,041 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:18:45,057 - INFO - Finished converting document 8-K_2024-02-28 in 0.05 sec.
2025-11-14 17:18:45,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,112 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MO\8-K_2024-02-01' --> 'data\processed_data\MO\8-K_2024-02-01.md'
Converted 'data\edgar_documents\MO\8-K_2024-02-26' --> 'data\processed_data\MO\8-K_2024-02-26.md'
Converted 'data\edgar_documents\MO\8-K_2024-02-28' --> 'data\processed_data\MO\8-K_2024-02-28.md'
Converted 'data\edgar_documents\MO\8-K_2024-03-14' --> 'data\processed_data\MO\8-K_2024-03-14.md'


2025-11-14 17:18:45,162 - INFO - Going to convert document batch...
2025-11-14 17:18:45,162 - INFO - Processing document 8-K_2024-03-19
2025-11-14 17:18:45,182 - INFO - Finished converting document 8-K_2024-03-19 in 0.05 sec.
2025-11-14 17:18:45,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,219 - INFO - Going to convert document batch...
2025-11-14 17:18:45,220 - INFO - Processing document 8-K_2024-04-25
2025-11-14 17:18:45,239 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 17:18:45,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,280 - INFO - Going to convert document batch...
2025-11-14 17:18:45,281 - INFO - Processing document 8-K_2024-05-20
2025-11-14 17:18:45,313 - INFO - Finished converting document 8-K_2024-05-20 in 0.06 sec.
2025-11-14 17:18:45,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,352 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MO\8-K_2024-03-19' --> 'data\processed_data\MO\8-K_2024-03-19.md'
Converted 'data\edgar_documents\MO\8-K_2024-04-25' --> 'data\processed_data\MO\8-K_2024-04-25.md'
Converted 'data\edgar_documents\MO\8-K_2024-05-20' --> 'data\processed_data\MO\8-K_2024-05-20.md'


2025-11-14 17:18:45,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,405 - INFO - Going to convert document batch...
2025-11-14 17:18:45,405 - INFO - Processing document 8-K_2024-10-31
2025-11-14 17:18:45,426 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 17:18:45,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,461 - INFO - Going to convert document batch...
2025-11-14 17:18:45,462 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:18:45,482 - INFO - Finished converting document 8-K_2025-01-30 in 0.05 sec.
2025-11-14 17:18:45,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,520 - INFO - Going to convert document batch...
2025-11-14 17:18:45,521 - INFO - Processing document 8-K_2025-02-06


Converted 'data\edgar_documents\MO\8-K_2024-07-31' --> 'data\processed_data\MO\8-K_2024-07-31.md'
Converted 'data\edgar_documents\MO\8-K_2024-10-31' --> 'data\processed_data\MO\8-K_2024-10-31.md'
Converted 'data\edgar_documents\MO\8-K_2025-01-30' --> 'data\processed_data\MO\8-K_2025-01-30.md'


2025-11-14 17:18:45,928 - INFO - Finished converting document 8-K_2025-02-06 in 0.42 sec.
2025-11-14 17:18:45,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:45,962 - INFO - Going to convert document batch...
2025-11-14 17:18:45,964 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:18:45,983 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 17:18:46,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,026 - INFO - Going to convert document batch...
2025-11-14 17:18:46,027 - INFO - Processing document 8-K_2025-05-19
2025-11-14 17:18:46,062 - INFO - Finished converting document 8-K_2025-05-19 in 0.08 sec.
2025-11-14 17:18:46,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,133 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MO\8-K_2025-02-06' --> 'data\processed_data\MO\8-K_2025-02-06.md'
Converted 'data\edgar_documents\MO\8-K_2025-04-29' --> 'data\processed_data\MO\8-K_2025-04-29.md'
Converted 'data\edgar_documents\MO\8-K_2025-05-19' --> 'data\processed_data\MO\8-K_2025-05-19.md'


2025-11-14 17:18:46,133 - INFO - Processing document 8-K_2025-06-03
2025-11-14 17:18:46,153 - INFO - Finished converting document 8-K_2025-06-03 in 0.08 sec.
2025-11-14 17:18:46,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,191 - INFO - Going to convert document batch...
2025-11-14 17:18:46,192 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:18:46,211 - INFO - Finished converting document 8-K_2025-07-23 in 0.05 sec.
2025-11-14 17:18:46,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,245 - INFO - Going to convert document batch...
2025-11-14 17:18:46,246 - INFO - Processing document 8-K_2025-07-30
2025-11-14 17:18:46,264 - INFO - Finished converting document 8-K_2025-07-30 in 0.05 sec.
2025-11-14 17:18:46,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,301 - INFO - Going to convert document batch...
2025-11-14 17:18:46,301 - INFO - Processing document 8-K_2025-08-06
2025-11-14 17:

Converted 'data\edgar_documents\MO\8-K_2025-06-03' --> 'data\processed_data\MO\8-K_2025-06-03.md'
Converted 'data\edgar_documents\MO\8-K_2025-07-23' --> 'data\processed_data\MO\8-K_2025-07-23.md'
Converted 'data\edgar_documents\MO\8-K_2025-07-30' --> 'data\processed_data\MO\8-K_2025-07-30.md'
Converted 'data\edgar_documents\MO\8-K_2025-08-06' --> 'data\processed_data\MO\8-K_2025-08-06.md'


2025-11-14 17:18:46,359 - INFO - Going to convert document batch...
2025-11-14 17:18:46,359 - INFO - Processing document 8-K_2025-10-09
2025-11-14 17:18:46,378 - INFO - Finished converting document 8-K_2025-10-09 in 0.05 sec.
2025-11-14 17:18:46,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:18:46,412 - INFO - Going to convert document batch...
2025-11-14 17:18:46,413 - INFO - Processing document 8-K_2025-10-30
2025-11-14 17:18:46,432 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 17:18:46,477 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:18:46,478 - ERROR - Input document DEF-14A_2023-04-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\MO\8-K_2025-10-09' --> 'data\processed_data\MO\8-K_2025-10-09.md'
Converted 'data\edgar_documents\MO\8-K_2025-10-30' --> 'data\processed_data\MO\8-K_2025-10-30.md'
Error processing data\edgar_documents\MO\DEF-14A_2023-04-06: File format not allowed: data\edgar_documents\MO\DEF-14A_2023-04-06


2025-11-14 17:18:47,484 - INFO - Going to convert document batch...
2025-11-14 17:18:47,486 - INFO - Processing document DEF-14A_2024-04-04
2025-11-14 17:18:56,421 - INFO - Finished converting document DEF-14A_2024-04-04 in 9.94 sec.
2025-11-14 17:18:57,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\DEF-14A_2024-04-04' --> 'data\processed_data\MO\DEF-14A_2024-04-04.md'


2025-11-14 17:18:58,563 - INFO - Going to convert document batch...
2025-11-14 17:18:58,564 - INFO - Processing document DEF-14A_2025-04-03
2025-11-14 17:19:08,743 - INFO - Finished converting document DEF-14A_2025-04-03 in 11.33 sec.
2025-11-14 17:19:09,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MO\DEF-14A_2025-04-03' --> 'data\processed_data\MO\DEF-14A_2025-04-03.md'
Processed 81 new files. Errors: 7
Found 101 files to process in data\edgar_documents\MRK


2025-11-14 17:19:10,931 - INFO - Going to convert document batch...
2025-11-14 17:19:10,931 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:19:10,933 - INFO - Processing document 10-K_2023-02-24
2025-11-14 17:19:13,540 - INFO - Finished converting document 10-K_2023-02-24 in 3.83 sec.
2025-11-14 17:19:14,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-K_2023-02-24' --> 'data\processed_data\MRK\10-K_2023-02-24.md'


2025-11-14 17:19:15,778 - INFO - Going to convert document batch...
2025-11-14 17:19:15,783 - INFO - Processing document 10-K_2024-02-26
2025-11-14 17:19:17,993 - INFO - Finished converting document 10-K_2024-02-26 in 3.69 sec.
2025-11-14 17:19:18,737 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:18,738 - ERROR - Input document 10-K_2024-04-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:19:18,739 - INFO - Going to convert d

Converted 'data\edgar_documents\MRK\10-K_2024-02-26' --> 'data\processed_data\MRK\10-K_2024-02-26.md'
Error processing data\edgar_documents\MRK\10-K_2024-04-11: File format not allowed: data\edgar_documents\MRK\10-K_2024-04-11


2025-11-14 17:19:20,488 - INFO - Going to convert document batch...
2025-11-14 17:19:20,488 - INFO - Processing document 10-K_2025-02-25
2025-11-14 17:19:22,657 - INFO - Finished converting document 10-K_2025-02-25 in 3.92 sec.
2025-11-14 17:19:23,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-K_2025-02-25' --> 'data\processed_data\MRK\10-K_2025-02-25.md'


2025-11-14 17:19:24,497 - INFO - Going to convert document batch...
2025-11-14 17:19:24,497 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 17:19:25,319 - INFO - Finished converting document 10-Q_2023-05-05 in 1.94 sec.
2025-11-14 17:19:25,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2023-05-05' --> 'data\processed_data\MRK\10-Q_2023-05-05.md'


2025-11-14 17:19:26,322 - INFO - Going to convert document batch...
2025-11-14 17:19:26,323 - INFO - Processing document 10-Q_2023-08-07
2025-11-14 17:19:27,409 - INFO - Finished converting document 10-Q_2023-08-07 in 1.72 sec.
2025-11-14 17:19:27,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2023-08-07' --> 'data\processed_data\MRK\10-Q_2023-08-07.md'


2025-11-14 17:19:29,149 - INFO - Going to convert document batch...
2025-11-14 17:19:29,150 - INFO - Processing document 10-Q_2023-11-03
2025-11-14 17:19:30,320 - INFO - Finished converting document 10-Q_2023-11-03 in 2.41 sec.
2025-11-14 17:19:30,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2023-11-03' --> 'data\processed_data\MRK\10-Q_2023-11-03.md'


2025-11-14 17:19:31,736 - INFO - Going to convert document batch...
2025-11-14 17:19:31,737 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 17:19:32,589 - INFO - Finished converting document 10-Q_2024-05-03 in 1.77 sec.
2025-11-14 17:19:33,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2024-05-03' --> 'data\processed_data\MRK\10-Q_2024-05-03.md'


2025-11-14 17:19:34,005 - INFO - Going to convert document batch...
2025-11-14 17:19:34,005 - INFO - Processing document 10-Q_2024-08-05
2025-11-14 17:19:35,209 - INFO - Finished converting document 10-Q_2024-08-05 in 2.22 sec.
2025-11-14 17:19:35,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2024-08-05' --> 'data\processed_data\MRK\10-Q_2024-08-05.md'


2025-11-14 17:19:36,740 - INFO - Going to convert document batch...
2025-11-14 17:19:36,741 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 17:19:37,956 - INFO - Finished converting document 10-Q_2024-11-06 in 2.22 sec.
2025-11-14 17:19:38,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2024-11-06' --> 'data\processed_data\MRK\10-Q_2024-11-06.md'


2025-11-14 17:19:38,953 - INFO - Going to convert document batch...
2025-11-14 17:19:38,954 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 17:19:40,305 - INFO - Finished converting document 10-Q_2025-05-02 in 1.83 sec.
2025-11-14 17:19:40,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2025-05-02' --> 'data\processed_data\MRK\10-Q_2025-05-02.md'


2025-11-14 17:19:41,384 - INFO - Going to convert document batch...
2025-11-14 17:19:41,385 - INFO - Processing document 10-Q_2025-08-05
2025-11-14 17:19:43,059 - INFO - Finished converting document 10-Q_2025-08-05 in 2.34 sec.
2025-11-14 17:19:43,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\10-Q_2025-08-05' --> 'data\processed_data\MRK\10-Q_2025-08-05.md'


2025-11-14 17:19:44,278 - INFO - Going to convert document batch...
2025-11-14 17:19:44,279 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 17:19:45,600 - INFO - Finished converting document 10-Q_2025-11-05 in 2.03 sec.
2025-11-14 17:19:46,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,152 - INFO - Going to convert document batch...
2025-11-14 17:19:46,153 - INFO - Processing document 4_2023-01-03
2025-11-14 17:19:46,171 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 17:19:46,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,219 - INFO - Going to convert document batch...
2025-11-14 17:19:46,220 - INFO - Processing document 4_2023-01-11
2025-11-14 17:19:46,248 - INFO - Finished converting document 4_2023-01-11 in 0.06 sec.
2025-11-14 17:19:46,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,294 - INFO - Going to convert document batch...
2025-11-14 17:19:46,

Converted 'data\edgar_documents\MRK\10-Q_2025-11-05' --> 'data\processed_data\MRK\10-Q_2025-11-05.md'
Converted 'data\edgar_documents\MRK\4_2023-01-03' --> 'data\processed_data\MRK\4_2023-01-03.md'
Converted 'data\edgar_documents\MRK\4_2023-01-11' --> 'data\processed_data\MRK\4_2023-01-11.md'


2025-11-14 17:19:46,752 - INFO - Finished converting document 4_2023-01-25 in 0.47 sec.
2025-11-14 17:19:46,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,794 - INFO - Going to convert document batch...
2025-11-14 17:19:46,795 - INFO - Processing document 4_2023-02-06
2025-11-14 17:19:46,816 - INFO - Finished converting document 4_2023-02-06 in 0.05 sec.
2025-11-14 17:19:46,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,857 - INFO - Going to convert document batch...
2025-11-14 17:19:46,857 - INFO - Processing document 4_2023-02-08
2025-11-14 17:19:46,874 - INFO - Finished converting document 4_2023-02-08 in 0.05 sec.
2025-11-14 17:19:46,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:46,913 - INFO - Going to convert document batch...
2025-11-14 17:19:46,914 - INFO - Processing document 4_2023-02-10
2025-11-14 17:19:46,929 - INFO - Finished converting document 4_2023-02-10 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\MRK\4_2023-01-25' --> 'data\processed_data\MRK\4_2023-01-25.md'
Converted 'data\edgar_documents\MRK\4_2023-02-06' --> 'data\processed_data\MRK\4_2023-02-06.md'
Converted 'data\edgar_documents\MRK\4_2023-02-08' --> 'data\processed_data\MRK\4_2023-02-08.md'
Converted 'data\edgar_documents\MRK\4_2023-02-10' --> 'data\processed_data\MRK\4_2023-02-10.md'


2025-11-14 17:19:46,966 - INFO - Going to convert document batch...
2025-11-14 17:19:46,967 - INFO - Processing document 4_2023-02-13
2025-11-14 17:19:46,987 - INFO - Finished converting document 4_2023-02-13 in 0.05 sec.
2025-11-14 17:19:47,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,036 - INFO - Going to convert document batch...
2025-11-14 17:19:47,039 - INFO - Processing document 4_2023-02-14
2025-11-14 17:19:47,067 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.
2025-11-14 17:19:47,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,123 - INFO - Going to convert document batch...
2025-11-14 17:19:47,124 - INFO - Processing document 4_2023-02-16
2025-11-14 17:19:47,142 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 17:19:47,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,180 - INFO - Going to convert document batch...
2025-11-14 17:19:47,182 - 

Converted 'data\edgar_documents\MRK\4_2023-02-13' --> 'data\processed_data\MRK\4_2023-02-13.md'
Converted 'data\edgar_documents\MRK\4_2023-02-14' --> 'data\processed_data\MRK\4_2023-02-14.md'
Converted 'data\edgar_documents\MRK\4_2023-02-16' --> 'data\processed_data\MRK\4_2023-02-16.md'


2025-11-14 17:19:47,201 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 17:19:47,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,263 - INFO - Going to convert document batch...
2025-11-14 17:19:47,264 - INFO - Processing document 4_2023-04-14
2025-11-14 17:19:47,317 - INFO - Finished converting document 4_2023-04-14 in 0.08 sec.
2025-11-14 17:19:47,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,371 - INFO - Going to convert document batch...
2025-11-14 17:19:47,372 - INFO - Processing document 4_2023-04-28
2025-11-14 17:19:47,394 - INFO - Finished converting document 4_2023-04-28 in 0.05 sec.
2025-11-14 17:19:47,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MRK\4_2023-04-03' --> 'data\processed_data\MRK\4_2023-04-03.md'
Converted 'data\edgar_documents\MRK\4_2023-04-14' --> 'data\processed_data\MRK\4_2023-04-14.md'
Converted 'data\edgar_documents\MRK\4_2023-04-28' --> 'data\processed_data\MRK\4_2023-04-28.md'


2025-11-14 17:19:47,443 - INFO - Going to convert document batch...
2025-11-14 17:19:47,444 - INFO - Processing document 4_2023-05-02
2025-11-14 17:19:47,472 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 17:19:47,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,527 - INFO - Going to convert document batch...
2025-11-14 17:19:47,528 - INFO - Processing document 4_2023-05-03
2025-11-14 17:19:47,552 - INFO - Finished converting document 4_2023-05-03 in 0.05 sec.
2025-11-14 17:19:47,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,602 - INFO - Going to convert document batch...
2025-11-14 17:19:47,603 - INFO - Processing document 4_2023-05-04
2025-11-14 17:19:47,623 - INFO - Finished converting document 4_2023-05-04 in 0.05 sec.
2025-11-14 17:19:47,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,680 - INFO - Going to convert document batch...
2025-11-14 17:19:47,681 - 

Converted 'data\edgar_documents\MRK\4_2023-05-02' --> 'data\processed_data\MRK\4_2023-05-02.md'
Converted 'data\edgar_documents\MRK\4_2023-05-03' --> 'data\processed_data\MRK\4_2023-05-03.md'
Converted 'data\edgar_documents\MRK\4_2023-05-04' --> 'data\processed_data\MRK\4_2023-05-04.md'


2025-11-14 17:19:47,770 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:47,771 - ERROR - Input document 4_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:19:47,772 - INFO - Going to convert document batch...
2025-11-14 17:19:47,791 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:47,792 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\MRK\4_2023-05-05' --> 'data\processed_data\MRK\4_2023-05-05.md'
Error processing data\edgar_documents\MRK\4_2023-05-08: File format not allowed: data\edgar_documents\MRK\4_2023-05-08
Error processing data\edgar_documents\MRK\4_2023-05-10: File format not allowed: data\edgar_documents\MRK\4_2023-05-10
Converted 'data\edgar_documents\MRK\4_2023-05-31' --> 'data\processed_data\MRK\4_2023-05-31.md'


2025-11-14 17:19:47,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:47,969 - INFO - Going to convert document batch...
2025-11-14 17:19:47,970 - INFO - Processing document 4_2023-07-05
2025-11-14 17:19:47,994 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 17:19:48,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,042 - INFO - Going to convert document batch...
2025-11-14 17:19:48,043 - INFO - Processing document 4_2023-08-03
2025-11-14 17:19:48,062 - INFO - Finished converting document 4_2023-08-03 in 0.05 sec.
2025-11-14 17:19:48,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,101 - INFO - Going to convert document batch...
2025-11-14 17:19:48,102 - INFO - Processing document 4_2023-08-04
2025-11-14 17:19:48,125 - INFO - Finished converting document 4_2023-08-04 in 0.05 sec.


Converted 'data\edgar_documents\MRK\4_2023-06-30' --> 'data\processed_data\MRK\4_2023-06-30.md'
Converted 'data\edgar_documents\MRK\4_2023-07-05' --> 'data\processed_data\MRK\4_2023-07-05.md'
Converted 'data\edgar_documents\MRK\4_2023-08-03' --> 'data\processed_data\MRK\4_2023-08-03.md'


2025-11-14 17:19:48,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,166 - INFO - Going to convert document batch...
2025-11-14 17:19:48,167 - INFO - Processing document 4_2023-08-15
2025-11-14 17:19:48,184 - INFO - Finished converting document 4_2023-08-15 in 0.05 sec.
2025-11-14 17:19:48,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,225 - INFO - Going to convert document batch...
2025-11-14 17:19:48,226 - INFO - Processing document 4_2023-10-03
2025-11-14 17:19:48,245 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.
2025-11-14 17:19:48,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,286 - INFO - Going to convert document batch...
2025-11-14 17:19:48,287 - INFO - Processing document 4_2023-10-31
2025-11-14 17:19:48,307 - INFO - Finished converting document 4_2023-10-31 in 0.05 sec.


Converted 'data\edgar_documents\MRK\4_2023-08-04' --> 'data\processed_data\MRK\4_2023-08-04.md'
Converted 'data\edgar_documents\MRK\4_2023-08-15' --> 'data\processed_data\MRK\4_2023-08-15.md'
Converted 'data\edgar_documents\MRK\4_2023-10-03' --> 'data\processed_data\MRK\4_2023-10-03.md'


2025-11-14 17:19:48,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,349 - INFO - Going to convert document batch...
2025-11-14 17:19:48,350 - INFO - Processing document 4_2023-11-01
2025-11-14 17:19:48,383 - INFO - Finished converting document 4_2023-11-01 in 0.05 sec.
2025-11-14 17:19:48,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,439 - INFO - Going to convert document batch...
2025-11-14 17:19:48,440 - INFO - Processing document 4_2023-11-09
2025-11-14 17:19:48,460 - INFO - Finished converting document 4_2023-11-09 in 0.05 sec.
2025-11-14 17:19:48,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,500 - INFO - Going to convert document batch...
2025-11-14 17:19:48,501 - INFO - Processing document 4_2023-11-13
2025-11-14 17:19:48,519 - INFO - Finished converting document 4_2023-11-13 in 0.03 sec.


Converted 'data\edgar_documents\MRK\4_2023-10-31' --> 'data\processed_data\MRK\4_2023-10-31.md'
Converted 'data\edgar_documents\MRK\4_2023-11-01' --> 'data\processed_data\MRK\4_2023-11-01.md'
Converted 'data\edgar_documents\MRK\4_2023-11-09' --> 'data\processed_data\MRK\4_2023-11-09.md'


2025-11-14 17:19:48,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,560 - INFO - Going to convert document batch...
2025-11-14 17:19:48,561 - INFO - Processing document 4_2024-01-02
2025-11-14 17:19:48,584 - INFO - Finished converting document 4_2024-01-02 in 0.05 sec.
2025-11-14 17:19:48,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,650 - INFO - Going to convert document batch...
2025-11-14 17:19:48,651 - INFO - Processing document 4_2024-01-24
2025-11-14 17:19:48,669 - INFO - Finished converting document 4_2024-01-24 in 0.06 sec.
2025-11-14 17:19:48,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,712 - INFO - Going to convert document batch...
2025-11-14 17:19:48,712 - INFO - Processing document 4_2024-02-02


Converted 'data\edgar_documents\MRK\4_2023-11-13' --> 'data\processed_data\MRK\4_2023-11-13.md'
Converted 'data\edgar_documents\MRK\4_2024-01-02' --> 'data\processed_data\MRK\4_2024-01-02.md'
Converted 'data\edgar_documents\MRK\4_2024-01-24' --> 'data\processed_data\MRK\4_2024-01-24.md'


2025-11-14 17:19:48,736 - INFO - Finished converting document 4_2024-02-02 in 0.05 sec.
2025-11-14 17:19:48,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,784 - INFO - Going to convert document batch...
2025-11-14 17:19:48,785 - INFO - Processing document 4_2024-02-05
2025-11-14 17:19:48,810 - INFO - Finished converting document 4_2024-02-05 in 0.06 sec.
2025-11-14 17:19:48,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,868 - INFO - Going to convert document batch...
2025-11-14 17:19:48,869 - INFO - Processing document 4_2024-02-08
2025-11-14 17:19:48,887 - INFO - Finished converting document 4_2024-02-08 in 0.06 sec.
2025-11-14 17:19:48,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,929 - INFO - Going to convert document batch...
2025-11-14 17:19:48,929 - INFO - Processing document 4_2024-02-12
2025-11-14 17:19:48,951 - INFO - Finished converting document 4_2024-02-12 in 0.05 sec.


Converted 'data\edgar_documents\MRK\4_2024-02-02' --> 'data\processed_data\MRK\4_2024-02-02.md'
Converted 'data\edgar_documents\MRK\4_2024-02-05' --> 'data\processed_data\MRK\4_2024-02-05.md'
Converted 'data\edgar_documents\MRK\4_2024-02-08' --> 'data\processed_data\MRK\4_2024-02-08.md'


2025-11-14 17:19:48,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:48,994 - INFO - Going to convert document batch...
2025-11-14 17:19:48,995 - INFO - Processing document 4_2024-02-14
2025-11-14 17:19:49,013 - INFO - Finished converting document 4_2024-02-14 in 0.05 sec.
2025-11-14 17:19:49,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,056 - INFO - Going to convert document batch...
2025-11-14 17:19:49,057 - INFO - Processing document 4_2024-02-15
2025-11-14 17:19:49,080 - INFO - Finished converting document 4_2024-02-15 in 0.05 sec.
2025-11-14 17:19:49,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,125 - INFO - Going to convert document batch...
2025-11-14 17:19:49,126 - INFO - Processing document 4_2024-03-11
2025-11-14 17:19:49,153 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.


Converted 'data\edgar_documents\MRK\4_2024-02-12' --> 'data\processed_data\MRK\4_2024-02-12.md'
Converted 'data\edgar_documents\MRK\4_2024-02-14' --> 'data\processed_data\MRK\4_2024-02-14.md'
Converted 'data\edgar_documents\MRK\4_2024-02-15' --> 'data\processed_data\MRK\4_2024-02-15.md'


2025-11-14 17:19:49,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,198 - INFO - Going to convert document batch...
2025-11-14 17:19:49,199 - INFO - Processing document 4_2024-03-29
2025-11-14 17:19:49,219 - INFO - Finished converting document 4_2024-03-29 in 0.05 sec.
2025-11-14 17:19:49,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,266 - INFO - Going to convert document batch...
2025-11-14 17:19:49,267 - INFO - Processing document 4_2024-05-02
2025-11-14 17:19:49,294 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 17:19:49,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,339 - INFO - Going to convert document batch...
2025-11-14 17:19:49,339 - INFO - Processing document 4_2024-05-06


Converted 'data\edgar_documents\MRK\4_2024-03-11' --> 'data\processed_data\MRK\4_2024-03-11.md'
Converted 'data\edgar_documents\MRK\4_2024-03-29' --> 'data\processed_data\MRK\4_2024-03-29.md'
Converted 'data\edgar_documents\MRK\4_2024-05-02' --> 'data\processed_data\MRK\4_2024-05-02.md'


2025-11-14 17:19:49,370 - INFO - Finished converting document 4_2024-05-06 in 0.06 sec.
2025-11-14 17:19:49,415 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:49,415 - ERROR - Input document 4_2024-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:19:49,416 - INFO - Going to convert document batch...
2025-11-14 17:19:49,438 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:49,438 - ERROR - Input document 4_2024-05-20 with forma

Converted 'data\edgar_documents\MRK\4_2024-05-06' --> 'data\processed_data\MRK\4_2024-05-06.md'
Error processing data\edgar_documents\MRK\4_2024-05-15: File format not allowed: data\edgar_documents\MRK\4_2024-05-15
Error processing data\edgar_documents\MRK\4_2024-05-20: File format not allowed: data\edgar_documents\MRK\4_2024-05-20
Converted 'data\edgar_documents\MRK\4_2024-06-04' --> 'data\processed_data\MRK\4_2024-06-04.md'
Converted 'data\edgar_documents\MRK\4_2024-07-02' --> 'data\processed_data\MRK\4_2024-07-02.md'


2025-11-14 17:19:49,586 - INFO - Going to convert document batch...
2025-11-14 17:19:49,586 - INFO - Processing document 4_2024-08-06
2025-11-14 17:19:49,607 - INFO - Finished converting document 4_2024-08-06 in 0.05 sec.
2025-11-14 17:19:49,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,653 - INFO - Going to convert document batch...
2025-11-14 17:19:49,653 - INFO - Processing document 4_2024-10-01
2025-11-14 17:19:49,672 - INFO - Finished converting document 4_2024-10-01 in 0.05 sec.
2025-11-14 17:19:49,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,737 - INFO - Going to convert document batch...
2025-11-14 17:19:49,738 - INFO - Processing document 4_2025-01-03
2025-11-14 17:19:49,758 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:19:49,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,798 - INFO - Going to convert document batch...
2025-11-14 17:19:49,799 - 

Converted 'data\edgar_documents\MRK\4_2024-08-06' --> 'data\processed_data\MRK\4_2024-08-06.md'
Converted 'data\edgar_documents\MRK\4_2024-10-01' --> 'data\processed_data\MRK\4_2024-10-01.md'
Converted 'data\edgar_documents\MRK\4_2025-01-03' --> 'data\processed_data\MRK\4_2025-01-03.md'


2025-11-14 17:19:49,819 - INFO - Finished converting document 4_2025-01-29 in 0.03 sec.
2025-11-14 17:19:49,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,859 - INFO - Going to convert document batch...
2025-11-14 17:19:49,860 - INFO - Processing document 4_2025-02-07
2025-11-14 17:19:49,878 - INFO - Finished converting document 4_2025-02-07 in 0.03 sec.
2025-11-14 17:19:49,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,920 - INFO - Going to convert document batch...
2025-11-14 17:19:49,921 - INFO - Processing document 4_2025-02-11
2025-11-14 17:19:49,940 - INFO - Finished converting document 4_2025-02-11 in 0.05 sec.
2025-11-14 17:19:49,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:49,983 - INFO - Going to convert document batch...
2025-11-14 17:19:49,984 - INFO - Processing document 4_2025-02-13
2025-11-14 17:19:50,002 - INFO - Finished converting document 4_2025-02-13 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\MRK\4_2025-01-29' --> 'data\processed_data\MRK\4_2025-01-29.md'
Converted 'data\edgar_documents\MRK\4_2025-02-07' --> 'data\processed_data\MRK\4_2025-02-07.md'
Converted 'data\edgar_documents\MRK\4_2025-02-11' --> 'data\processed_data\MRK\4_2025-02-11.md'
Converted 'data\edgar_documents\MRK\4_2025-02-13' --> 'data\processed_data\MRK\4_2025-02-13.md'


2025-11-14 17:19:50,039 - INFO - Going to convert document batch...
2025-11-14 17:19:50,039 - INFO - Processing document 4_2025-02-20
2025-11-14 17:19:50,057 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 17:19:50,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,099 - INFO - Going to convert document batch...
2025-11-14 17:19:50,100 - INFO - Processing document 4_2025-04-02
2025-11-14 17:19:50,142 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 17:19:50,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,184 - INFO - Going to convert document batch...
2025-11-14 17:19:50,185 - INFO - Processing document 4_2025-04-29
2025-11-14 17:19:50,207 - INFO - Finished converting document 4_2025-04-29 in 0.05 sec.
2025-11-14 17:19:50,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,245 - INFO - Going to convert document batch...
2025-11-14 17:19:50,246 - 

Converted 'data\edgar_documents\MRK\4_2025-02-20' --> 'data\processed_data\MRK\4_2025-02-20.md'
Converted 'data\edgar_documents\MRK\4_2025-04-02' --> 'data\processed_data\MRK\4_2025-04-02.md'
Converted 'data\edgar_documents\MRK\4_2025-04-29' --> 'data\processed_data\MRK\4_2025-04-29.md'


2025-11-14 17:19:50,267 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-11-14 17:19:50,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,313 - INFO - Going to convert document batch...
2025-11-14 17:19:50,314 - INFO - Processing document 4_2025-05-02
2025-11-14 17:19:50,339 - INFO - Finished converting document 4_2025-05-02 in 0.06 sec.
2025-11-14 17:19:50,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,389 - INFO - Going to convert document batch...
2025-11-14 17:19:50,390 - INFO - Processing document 4_2025-05-05
2025-11-14 17:19:50,413 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 17:19:50,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,457 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MRK\4_2025-05-01' --> 'data\processed_data\MRK\4_2025-05-01.md'
Converted 'data\edgar_documents\MRK\4_2025-05-02' --> 'data\processed_data\MRK\4_2025-05-02.md'
Converted 'data\edgar_documents\MRK\4_2025-05-05' --> 'data\processed_data\MRK\4_2025-05-05.md'


2025-11-14 17:19:50,658 - INFO - Processing document 4_2025-06-03
2025-11-14 17:19:50,676 - INFO - Finished converting document 4_2025-06-03 in 0.23 sec.
2025-11-14 17:19:50,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,734 - INFO - Going to convert document batch...
2025-11-14 17:19:50,737 - INFO - Processing document 4_2025-07-02
2025-11-14 17:19:50,761 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 17:19:50,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,819 - INFO - Going to convert document batch...
2025-11-14 17:19:50,820 - INFO - Processing document 4_2025-08-05
2025-11-14 17:19:50,840 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 17:19:50,881 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:50,882 - ERROR - Input document 4_2025-09-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\MRK\4_2025-06-03' --> 'data\processed_data\MRK\4_2025-06-03.md'
Converted 'data\edgar_documents\MRK\4_2025-07-02' --> 'data\processed_data\MRK\4_2025-07-02.md'
Converted 'data\edgar_documents\MRK\4_2025-08-05' --> 'data\processed_data\MRK\4_2025-08-05.md'
Error processing data\edgar_documents\MRK\4_2025-09-02: File format not allowed: data\edgar_documents\MRK\4_2025-09-02


2025-11-14 17:19:50,905 - ERROR - Input document 4_2025-09-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:19:50,907 - INFO - Going to convert document batch...
2025-11-14 17:19:50,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:50,931 - INFO - Going to convert document batch...
2025-11-14 17:19:50,932 - INFO - Processing document 4_2025-10-02
2025-11-14 17:19:50,956 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 17:19:50,992 - INFO - detec

Error processing data\edgar_documents\MRK\4_2025-09-04: File format not allowed: data\edgar_documents\MRK\4_2025-09-04
Converted 'data\edgar_documents\MRK\4_2025-10-02' --> 'data\processed_data\MRK\4_2025-10-02.md'
Converted 'data\edgar_documents\MRK\4_2025-11-04' --> 'data\processed_data\MRK\4_2025-11-04.md'


2025-11-14 17:19:51,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,124 - INFO - Going to convert document batch...
2025-11-14 17:19:51,125 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:19:51,149 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 17:19:51,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,221 - INFO - Going to convert document batch...
2025-11-14 17:19:51,222 - INFO - Processing document 8-K_2023-05-17
2025-11-14 17:19:51,246 - INFO - Finished converting document 8-K_2023-05-17 in 0.08 sec.
2025-11-14 17:19:51,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,308 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MRK\8-K_2023-02-02' --> 'data\processed_data\MRK\8-K_2023-02-02.md'
Converted 'data\edgar_documents\MRK\8-K_2023-04-27' --> 'data\processed_data\MRK\8-K_2023-04-27.md'
Converted 'data\edgar_documents\MRK\8-K_2023-05-17' --> 'data\processed_data\MRK\8-K_2023-05-17.md'


2025-11-14 17:19:51,309 - INFO - Processing document 8-K_2023-05-26
2025-11-14 17:19:51,359 - INFO - Finished converting document 8-K_2023-05-26 in 0.11 sec.
2025-11-14 17:19:51,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,408 - INFO - Going to convert document batch...
2025-11-14 17:19:51,409 - INFO - Processing document 8-K_2023-08-01
2025-11-14 17:19:51,432 - INFO - Finished converting document 8-K_2023-08-01 in 0.06 sec.
2025-11-14 17:19:51,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,472 - INFO - Going to convert document batch...
2025-11-14 17:19:51,473 - INFO - Processing document 8-K_2023-10-26
2025-11-14 17:19:51,492 - INFO - Finished converting document 8-K_2023-10-26 in 0.05 sec.
2025-11-14 17:19:51,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,531 - INFO - Going to convert document batch...
2025-11-14 17:19:51,532 - INFO - Processing document 8-K_2023-11-28
2025-11-14 17:

Converted 'data\edgar_documents\MRK\8-K_2023-05-26' --> 'data\processed_data\MRK\8-K_2023-05-26.md'
Converted 'data\edgar_documents\MRK\8-K_2023-08-01' --> 'data\processed_data\MRK\8-K_2023-08-01.md'
Converted 'data\edgar_documents\MRK\8-K_2023-10-26' --> 'data\processed_data\MRK\8-K_2023-10-26.md'
Converted 'data\edgar_documents\MRK\8-K_2023-11-28' --> 'data\processed_data\MRK\8-K_2023-11-28.md'


2025-11-14 17:19:51,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,612 - INFO - Going to convert document batch...
2025-11-14 17:19:51,613 - INFO - Processing document 8-K_2024-02-01
2025-11-14 17:19:51,635 - INFO - Finished converting document 8-K_2024-02-01 in 0.08 sec.
2025-11-14 17:19:51,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,676 - INFO - Going to convert document batch...
2025-11-14 17:19:51,677 - INFO - Processing document 8-K_2024-02-20
2025-11-14 17:19:51,692 - INFO - Finished converting document 8-K_2024-02-20 in 0.03 sec.
2025-11-14 17:19:51,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,730 - INFO - Going to convert document batch...
2025-11-14 17:19:51,731 - INFO - Processing document 8-K_2024-04-25
2025-11-14 17:19:51,751 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 17:19:51,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\MRK\8-K_2024-02-01' --> 'data\processed_data\MRK\8-K_2024-02-01.md'
Converted 'data\edgar_documents\MRK\8-K_2024-02-20' --> 'data\processed_data\MRK\8-K_2024-02-20.md'
Converted 'data\edgar_documents\MRK\8-K_2024-04-25' --> 'data\processed_data\MRK\8-K_2024-04-25.md'


2025-11-14 17:19:51,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:51,928 - INFO - Going to convert document batch...
2025-11-14 17:19:51,928 - INFO - Processing document 8-K_2024-07-30
2025-11-14 17:19:51,952 - INFO - Finished converting document 8-K_2024-07-30 in 0.08 sec.
2025-11-14 17:19:51,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,006 - INFO - Going to convert document batch...
2025-11-14 17:19:52,008 - INFO - Processing document 8-K_2024-10-31
2025-11-14 17:19:52,046 - INFO - Finished converting document 8-K_2024-10-31 in 0.08 sec.


Converted 'data\edgar_documents\MRK\8-K_2024-05-30' --> 'data\processed_data\MRK\8-K_2024-05-30.md'
Converted 'data\edgar_documents\MRK\8-K_2024-07-30' --> 'data\processed_data\MRK\8-K_2024-07-30.md'


2025-11-14 17:19:52,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,099 - INFO - Going to convert document batch...
2025-11-14 17:19:52,100 - INFO - Processing document 8-K_2024-11-22
2025-11-14 17:19:52,131 - INFO - Finished converting document 8-K_2024-11-22 in 0.06 sec.
2025-11-14 17:19:52,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,178 - INFO - Going to convert document batch...
2025-11-14 17:19:52,179 - INFO - Processing document 8-K_2025-02-04
2025-11-14 17:19:52,202 - INFO - Finished converting document 8-K_2025-02-04 in 0.05 sec.
2025-11-14 17:19:52,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,244 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MRK\8-K_2024-10-31' --> 'data\processed_data\MRK\8-K_2024-10-31.md'
Converted 'data\edgar_documents\MRK\8-K_2024-11-22' --> 'data\processed_data\MRK\8-K_2024-11-22.md'
Converted 'data\edgar_documents\MRK\8-K_2025-02-04' --> 'data\processed_data\MRK\8-K_2025-02-04.md'


2025-11-14 17:19:52,244 - INFO - Processing document 8-K_2025-04-24
2025-11-14 17:19:52,265 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 17:19:52,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,338 - INFO - Going to convert document batch...
2025-11-14 17:19:52,339 - INFO - Processing document 8-K_2025-05-29
2025-11-14 17:19:52,384 - INFO - Finished converting document 8-K_2025-05-29 in 0.09 sec.
2025-11-14 17:19:52,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,431 - INFO - Going to convert document batch...
2025-11-14 17:19:52,432 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:19:52,459 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.


Converted 'data\edgar_documents\MRK\8-K_2025-04-24' --> 'data\processed_data\MRK\8-K_2025-04-24.md'
Converted 'data\edgar_documents\MRK\8-K_2025-05-29' --> 'data\processed_data\MRK\8-K_2025-05-29.md'


2025-11-14 17:19:52,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,507 - INFO - Going to convert document batch...
2025-11-14 17:19:52,508 - INFO - Processing document 8-K_2025-09-09
2025-11-14 17:19:52,532 - INFO - Finished converting document 8-K_2025-09-09 in 0.06 sec.
2025-11-14 17:19:52,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:52,575 - INFO - Going to convert document batch...
2025-11-14 17:19:52,576 - INFO - Processing document 8-K_2025-10-30
2025-11-14 17:19:52,601 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.


Converted 'data\edgar_documents\MRK\8-K_2025-07-29' --> 'data\processed_data\MRK\8-K_2025-07-29.md'
Converted 'data\edgar_documents\MRK\8-K_2025-09-09' --> 'data\processed_data\MRK\8-K_2025-09-09.md'
Converted 'data\edgar_documents\MRK\8-K_2025-10-30' --> 'data\processed_data\MRK\8-K_2025-10-30.md'


2025-11-14 17:19:52,670 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:52,671 - ERROR - Input document DEF-14A_2023-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:19:52,676 - INFO - Going to convert document batch...
2025-11-14 17:19:52,774 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:19:52,775 - ERROR - Input document DEF-14A_2024-04-11 with format No

Error processing data\edgar_documents\MRK\DEF-14A_2023-04-03: File format not allowed: data\edgar_documents\MRK\DEF-14A_2023-04-03
Error processing data\edgar_documents\MRK\DEF-14A_2024-04-11: File format not allowed: data\edgar_documents\MRK\DEF-14A_2024-04-11
Error processing data\edgar_documents\MRK\DEF-14A_2025-04-09: File format not allowed: data\edgar_documents\MRK\DEF-14A_2025-04-09
Processed 91 new files. Errors: 10
Found 132 files to process in data\edgar_documents\MSFT


2025-11-14 17:19:53,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:19:55,299 - INFO - Going to convert document batch...
2025-11-14 17:19:55,300 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:19:55,301 - INFO - Processing document 10-K_2023-07-27
2025-11-14 17:19:59,538 - INFO - Finished converting document 10-K_2023-07-27 in 6.67 sec.
2025-11-14 17:20:00,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-K_2023-07-27' --> 'data\processed_data\MSFT\10-K_2023-07-27.md'


2025-11-14 17:20:02,764 - INFO - Going to convert document batch...
2025-11-14 17:20:02,764 - INFO - Processing document 10-K_2024-07-30
2025-11-14 17:20:07,032 - INFO - Finished converting document 10-K_2024-07-30 in 6.56 sec.
2025-11-14 17:20:07,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-K_2024-07-30' --> 'data\processed_data\MSFT\10-K_2024-07-30.md'


2025-11-14 17:20:10,110 - INFO - Going to convert document batch...
2025-11-14 17:20:10,111 - INFO - Processing document 10-K_2025-07-30
2025-11-14 17:20:13,920 - INFO - Finished converting document 10-K_2025-07-30 in 6.34 sec.
2025-11-14 17:20:14,526 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:20:14,528 - ERROR - Input document 10-Q_2023-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:20:14,534 - INFO - Going to convert d

Converted 'data\edgar_documents\MSFT\10-K_2025-07-30' --> 'data\processed_data\MSFT\10-K_2025-07-30.md'
Error processing data\edgar_documents\MSFT\10-Q_2023-01-24: File format not allowed: data\edgar_documents\MSFT\10-Q_2023-01-24


2025-11-14 17:20:14,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:17,258 - INFO - Going to convert document batch...
2025-11-14 17:20:17,259 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 17:20:19,464 - INFO - Finished converting document 10-Q_2023-04-25 in 4.94 sec.
2025-11-14 17:20:19,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2023-04-25' --> 'data\processed_data\MSFT\10-Q_2023-04-25.md'


2025-11-14 17:20:20,932 - INFO - Going to convert document batch...
2025-11-14 17:20:20,933 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 17:20:23,281 - INFO - Finished converting document 10-Q_2023-10-24 in 3.42 sec.
2025-11-14 17:20:23,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2023-10-24' --> 'data\processed_data\MSFT\10-Q_2023-10-24.md'


2025-11-14 17:20:25,729 - INFO - Going to convert document batch...
2025-11-14 17:20:25,730 - INFO - Processing document 10-Q_2024-01-30
2025-11-14 17:20:28,146 - INFO - Finished converting document 10-Q_2024-01-30 in 4.55 sec.
2025-11-14 17:20:28,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2024-01-30' --> 'data\processed_data\MSFT\10-Q_2024-01-30.md'


2025-11-14 17:20:30,654 - INFO - Going to convert document batch...
2025-11-14 17:20:30,655 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 17:20:33,038 - INFO - Finished converting document 10-Q_2024-04-25 in 4.47 sec.
2025-11-14 17:20:33,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2024-04-25' --> 'data\processed_data\MSFT\10-Q_2024-04-25.md'


2025-11-14 17:20:35,292 - INFO - Going to convert document batch...
2025-11-14 17:20:35,293 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 17:20:37,116 - INFO - Finished converting document 10-Q_2024-10-30 in 3.66 sec.
2025-11-14 17:20:37,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2024-10-30' --> 'data\processed_data\MSFT\10-Q_2024-10-30.md'


2025-11-14 17:20:39,903 - INFO - Going to convert document batch...
2025-11-14 17:20:39,904 - INFO - Processing document 10-Q_2025-01-29
2025-11-14 17:20:42,188 - INFO - Finished converting document 10-Q_2025-01-29 in 4.75 sec.
2025-11-14 17:20:42,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2025-01-29' --> 'data\processed_data\MSFT\10-Q_2025-01-29.md'


2025-11-14 17:20:44,681 - INFO - Going to convert document batch...
2025-11-14 17:20:44,682 - INFO - Processing document 10-Q_2025-04-30
2025-11-14 17:20:47,022 - INFO - Finished converting document 10-Q_2025-04-30 in 4.42 sec.
2025-11-14 17:20:47,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2025-04-30' --> 'data\processed_data\MSFT\10-Q_2025-04-30.md'


2025-11-14 17:20:49,337 - INFO - Going to convert document batch...
2025-11-14 17:20:49,338 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 17:20:51,212 - INFO - Finished converting document 10-Q_2025-10-29 in 3.78 sec.
2025-11-14 17:20:51,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:51,584 - INFO - Going to convert document batch...
2025-11-14 17:20:51,584 - INFO - Processing document 4_2023-01-18
2025-11-14 17:20:51,601 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:20:51,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:51,662 - INFO - Going to convert document batch...
2025-11-14 17:20:51,663 - INFO - Processing document 4_2023-02-01
2025-11-14 17:20:51,683 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 17:20:51,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\10-Q_2025-10-29' --> 'data\processed_data\MSFT\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\MSFT\4_2023-01-18' --> 'data\processed_data\MSFT\4_2023-01-18.md'
Converted 'data\edgar_documents\MSFT\4_2023-02-01' --> 'data\processed_data\MSFT\4_2023-02-01.md'


2025-11-14 17:20:51,722 - INFO - Going to convert document batch...
2025-11-14 17:20:51,723 - INFO - Processing document 4_2023-02-13
2025-11-14 17:20:51,740 - INFO - Finished converting document 4_2023-02-13 in 0.03 sec.
2025-11-14 17:20:51,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:51,780 - INFO - Going to convert document batch...
2025-11-14 17:20:51,781 - INFO - Processing document 4_2023-02-15
2025-11-14 17:20:51,798 - INFO - Finished converting document 4_2023-02-15 in 0.05 sec.
2025-11-14 17:20:51,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:51,853 - INFO - Going to convert document batch...
2025-11-14 17:20:51,854 - INFO - Processing document 4_2023-03-02
2025-11-14 17:20:51,875 - INFO - Finished converting document 4_2023-03-02 in 0.06 sec.
2025-11-14 17:20:51,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:51,926 - INFO - Going to convert document batch...
2025-11-14 17:20:51,927 - 

Converted 'data\edgar_documents\MSFT\4_2023-02-13' --> 'data\processed_data\MSFT\4_2023-02-13.md'
Converted 'data\edgar_documents\MSFT\4_2023-02-15' --> 'data\processed_data\MSFT\4_2023-02-15.md'
Converted 'data\edgar_documents\MSFT\4_2023-03-02' --> 'data\processed_data\MSFT\4_2023-03-02.md'


2025-11-14 17:20:51,958 - INFO - Finished converting document 4_2023-03-10 in 0.06 sec.
2025-11-14 17:20:52,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,018 - INFO - Going to convert document batch...
2025-11-14 17:20:52,020 - INFO - Processing document 4_2023-04-18
2025-11-14 17:20:52,048 - INFO - Finished converting document 4_2023-04-18 in 0.06 sec.
2025-11-14 17:20:52,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,095 - INFO - Going to convert document batch...
2025-11-14 17:20:52,096 - INFO - Processing document 4_2023-05-02
2025-11-14 17:20:52,116 - INFO - Finished converting document 4_2023-05-02 in 0.03 sec.
2025-11-14 17:20:52,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,163 - INFO - Going to convert document batch...
2025-11-14 17:20:52,164 - INFO - Processing document 4_2023-05-08


Converted 'data\edgar_documents\MSFT\4_2023-03-10' --> 'data\processed_data\MSFT\4_2023-03-10.md'
Converted 'data\edgar_documents\MSFT\4_2023-04-18' --> 'data\processed_data\MSFT\4_2023-04-18.md'
Converted 'data\edgar_documents\MSFT\4_2023-05-02' --> 'data\processed_data\MSFT\4_2023-05-02.md'


2025-11-14 17:20:52,184 - INFO - Finished converting document 4_2023-05-08 in 0.05 sec.
2025-11-14 17:20:52,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,236 - INFO - Going to convert document batch...
2025-11-14 17:20:52,237 - INFO - Processing document 4_2023-05-10
2025-11-14 17:20:52,276 - INFO - Finished converting document 4_2023-05-10 in 0.08 sec.
2025-11-14 17:20:52,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,330 - INFO - Going to convert document batch...
2025-11-14 17:20:52,330 - INFO - Processing document 4_2023-05-17
2025-11-14 17:20:52,353 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 17:20:52,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2023-05-08' --> 'data\processed_data\MSFT\4_2023-05-08.md'
Converted 'data\edgar_documents\MSFT\4_2023-05-10' --> 'data\processed_data\MSFT\4_2023-05-10.md'
Converted 'data\edgar_documents\MSFT\4_2023-05-17' --> 'data\processed_data\MSFT\4_2023-05-17.md'


2025-11-14 17:20:52,397 - INFO - Going to convert document batch...
2025-11-14 17:20:52,397 - INFO - Processing document 4_2023-05-19
2025-11-14 17:20:52,414 - INFO - Finished converting document 4_2023-05-19 in 0.03 sec.
2025-11-14 17:20:52,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,461 - INFO - Going to convert document batch...
2025-11-14 17:20:52,462 - INFO - Processing document 4_2023-05-31
2025-11-14 17:20:52,484 - INFO - Finished converting document 4_2023-05-31 in 0.05 sec.
2025-11-14 17:20:52,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,528 - INFO - Going to convert document batch...
2025-11-14 17:20:52,529 - INFO - Processing document 4_2023-06-05
2025-11-14 17:20:52,550 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 17:20:52,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,617 - INFO - Going to convert document batch...
2025-11-14 17:20:52,618 - 

Converted 'data\edgar_documents\MSFT\4_2023-05-19' --> 'data\processed_data\MSFT\4_2023-05-19.md'
Converted 'data\edgar_documents\MSFT\4_2023-05-31' --> 'data\processed_data\MSFT\4_2023-05-31.md'
Converted 'data\edgar_documents\MSFT\4_2023-06-05' --> 'data\processed_data\MSFT\4_2023-06-05.md'


2025-11-14 17:20:52,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,679 - INFO - Going to convert document batch...
2025-11-14 17:20:52,680 - INFO - Processing document 4_2023-06-09
2025-11-14 17:20:52,702 - INFO - Finished converting document 4_2023-06-09 in 0.05 sec.
2025-11-14 17:20:52,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,777 - INFO - Going to convert document batch...
2025-11-14 17:20:52,778 - INFO - Processing document 4_2023-06-14
2025-11-14 17:20:52,804 - INFO - Finished converting document 4_2023-06-14 in 0.06 sec.
2025-11-14 17:20:52,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2023-06-08' --> 'data\processed_data\MSFT\4_2023-06-08.md'
Converted 'data\edgar_documents\MSFT\4_2023-06-09' --> 'data\processed_data\MSFT\4_2023-06-09.md'
Converted 'data\edgar_documents\MSFT\4_2023-06-14' --> 'data\processed_data\MSFT\4_2023-06-14.md'


2025-11-14 17:20:52,851 - INFO - Going to convert document batch...
2025-11-14 17:20:52,852 - INFO - Processing document 4_2023-07-18
2025-11-14 17:20:52,870 - INFO - Finished converting document 4_2023-07-18 in 0.05 sec.
2025-11-14 17:20:52,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,912 - INFO - Going to convert document batch...
2025-11-14 17:20:52,913 - INFO - Processing document 4_2023-08-02
2025-11-14 17:20:52,932 - INFO - Finished converting document 4_2023-08-02 in 0.05 sec.
2025-11-14 17:20:52,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:52,992 - INFO - Going to convert document batch...
2025-11-14 17:20:52,993 - INFO - Processing document 4_2023-08-07
2025-11-14 17:20:53,015 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 17:20:53,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,054 - INFO - Going to convert document batch...
2025-11-14 17:20:53,054 - 

Converted 'data\edgar_documents\MSFT\4_2023-07-18' --> 'data\processed_data\MSFT\4_2023-07-18.md'
Converted 'data\edgar_documents\MSFT\4_2023-08-02' --> 'data\processed_data\MSFT\4_2023-08-02.md'
Converted 'data\edgar_documents\MSFT\4_2023-08-07' --> 'data\processed_data\MSFT\4_2023-08-07.md'


2025-11-14 17:20:53,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,114 - INFO - Going to convert document batch...
2025-11-14 17:20:53,115 - INFO - Processing document 4_2023-09-05
2025-11-14 17:20:53,132 - INFO - Finished converting document 4_2023-09-05 in 0.03 sec.
2025-11-14 17:20:53,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,192 - INFO - Going to convert document batch...
2025-11-14 17:20:53,193 - INFO - Processing document 4_2023-09-15
2025-11-14 17:20:53,218 - INFO - Finished converting document 4_2023-09-15 in 0.06 sec.
2025-11-14 17:20:53,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,261 - INFO - Going to convert document batch...
2025-11-14 17:20:53,262 - INFO - Processing document 4_2023-09-19
2025-11-14 17:20:53,279 - INFO - Finished converting document 4_2023-09-19 in 0.05 sec.


Converted 'data\edgar_documents\MSFT\4_2023-09-01' --> 'data\processed_data\MSFT\4_2023-09-01.md'
Converted 'data\edgar_documents\MSFT\4_2023-09-05' --> 'data\processed_data\MSFT\4_2023-09-05.md'
Converted 'data\edgar_documents\MSFT\4_2023-09-15' --> 'data\processed_data\MSFT\4_2023-09-15.md'


2025-11-14 17:20:53,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,329 - INFO - Going to convert document batch...
2025-11-14 17:20:53,329 - INFO - Processing document 4_2023-10-17
2025-11-14 17:20:53,349 - INFO - Finished converting document 4_2023-10-17 in 0.03 sec.
2025-11-14 17:20:53,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,398 - INFO - Going to convert document batch...
2025-11-14 17:20:53,399 - INFO - Processing document 4_2023-11-02
2025-11-14 17:20:53,416 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:20:53,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,455 - INFO - Going to convert document batch...
2025-11-14 17:20:53,455 - INFO - Processing document 4_2023-11-14
2025-11-14 17:20:53,472 - INFO - Finished converting document 4_2023-11-14 in 0.03 sec.
2025-11-14 17:20:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2023-09-19' --> 'data\processed_data\MSFT\4_2023-09-19.md'
Converted 'data\edgar_documents\MSFT\4_2023-10-17' --> 'data\processed_data\MSFT\4_2023-10-17.md'
Converted 'data\edgar_documents\MSFT\4_2023-11-02' --> 'data\processed_data\MSFT\4_2023-11-02.md'
Converted 'data\edgar_documents\MSFT\4_2023-11-14' --> 'data\processed_data\MSFT\4_2023-11-14.md'


2025-11-14 17:20:53,511 - INFO - Going to convert document batch...
2025-11-14 17:20:53,512 - INFO - Processing document 4_2023-12-01
2025-11-14 17:20:53,531 - INFO - Finished converting document 4_2023-12-01 in 0.05 sec.
2025-11-14 17:20:53,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,588 - INFO - Going to convert document batch...
2025-11-14 17:20:53,589 - INFO - Processing document 4_2023-12-07
2025-11-14 17:20:53,608 - INFO - Finished converting document 4_2023-12-07 in 0.06 sec.
2025-11-14 17:20:53,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,647 - INFO - Going to convert document batch...
2025-11-14 17:20:53,648 - INFO - Processing document 4_2023-12-11
2025-11-14 17:20:53,665 - INFO - Finished converting document 4_2023-12-11 in 0.03 sec.
2025-11-14 17:20:53,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,708 - INFO - Going to convert document batch...
2025-11-14 17:20:53,709 - 

Converted 'data\edgar_documents\MSFT\4_2023-12-01' --> 'data\processed_data\MSFT\4_2023-12-01.md'
Converted 'data\edgar_documents\MSFT\4_2023-12-07' --> 'data\processed_data\MSFT\4_2023-12-07.md'
Converted 'data\edgar_documents\MSFT\4_2023-12-11' --> 'data\processed_data\MSFT\4_2023-12-11.md'
Converted 'data\edgar_documents\MSFT\4_2023-12-15' --> 'data\processed_data\MSFT\4_2023-12-15.md'


2025-11-14 17:20:53,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,785 - INFO - Going to convert document batch...
2025-11-14 17:20:53,786 - INFO - Processing document 4_2023-12-29
2025-11-14 17:20:53,807 - INFO - Finished converting document 4_2023-12-29 in 0.05 sec.
2025-11-14 17:20:53,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,862 - INFO - Going to convert document batch...
2025-11-14 17:20:53,863 - INFO - Processing document 4_2024-01-16
2025-11-14 17:20:53,893 - INFO - Finished converting document 4_2024-01-16 in 0.06 sec.
2025-11-14 17:20:53,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:53,934 - INFO - Going to convert document batch...
2025-11-14 17:20:53,934 - INFO - Processing document 4_2024-02-01
2025-11-14 17:20:53,956 - INFO - Finished converting document 4_2024-02-01 in 0.05 sec.
2025-11-14 17:20:53,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\MSFT\4_2023-12-29' --> 'data\processed_data\MSFT\4_2023-12-29.md'
Converted 'data\edgar_documents\MSFT\4_2024-01-16' --> 'data\processed_data\MSFT\4_2024-01-16.md'
Converted 'data\edgar_documents\MSFT\4_2024-02-01' --> 'data\processed_data\MSFT\4_2024-02-01.md'


2025-11-14 17:20:54,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,074 - INFO - Going to convert document batch...
2025-11-14 17:20:54,075 - INFO - Processing document 4_2024-02-26
2025-11-14 17:20:54,115 - INFO - Finished converting document 4_2024-02-26 in 0.06 sec.
2025-11-14 17:20:54,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,223 - INFO - Going to convert document batch...
2025-11-14 17:20:54,224 - INFO - Processing document 4_2024-03-04
2025-11-14 17:20:54,241 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.


Converted 'data\edgar_documents\MSFT\4_2024-02-06' --> 'data\processed_data\MSFT\4_2024-02-06.md'
Converted 'data\edgar_documents\MSFT\4_2024-02-26' --> 'data\processed_data\MSFT\4_2024-02-26.md'


2025-11-14 17:20:54,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,280 - INFO - Going to convert document batch...
2025-11-14 17:20:54,281 - INFO - Processing document 4_2024-03-12
2025-11-14 17:20:54,299 - INFO - Finished converting document 4_2024-03-12 in 0.05 sec.
2025-11-14 17:20:54,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,343 - INFO - Going to convert document batch...
2025-11-14 17:20:54,344 - INFO - Processing document 4_2024-03-15
2025-11-14 17:20:54,366 - INFO - Finished converting document 4_2024-03-15 in 0.03 sec.
2025-11-14 17:20:54,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,404 - INFO - Going to convert document batch...
2025-11-14 17:20:54,404 - INFO - Processing document 4_2024-04-16
2025-11-14 17:20:54,422 - INFO - Finished converting document 4_2024-04-16 in 0.03 sec.


Converted 'data\edgar_documents\MSFT\4_2024-03-04' --> 'data\processed_data\MSFT\4_2024-03-04.md'
Converted 'data\edgar_documents\MSFT\4_2024-03-12' --> 'data\processed_data\MSFT\4_2024-03-12.md'
Converted 'data\edgar_documents\MSFT\4_2024-03-15' --> 'data\processed_data\MSFT\4_2024-03-15.md'


2025-11-14 17:20:54,457 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:20:54,458 - ERROR - Input document 4_2024-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:20:54,459 - INFO - Going to convert document batch...
2025-11-14 17:20:54,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:54,480 - INFO - Going to convert document batch...
2025-11-14 17:20:54,482 - INFO - Processing document 4_2024-05-24
2025-11-14 17:20:54,502 - INFO - Fin

Converted 'data\edgar_documents\MSFT\4_2024-04-16' --> 'data\processed_data\MSFT\4_2024-04-16.md'
Error processing data\edgar_documents\MSFT\4_2024-05-06: File format not allowed: data\edgar_documents\MSFT\4_2024-05-06
Converted 'data\edgar_documents\MSFT\4_2024-05-24' --> 'data\processed_data\MSFT\4_2024-05-24.md'
Converted 'data\edgar_documents\MSFT\4_2024-06-03' --> 'data\processed_data\MSFT\4_2024-06-03.md'


2025-11-14 17:20:54,628 - INFO - Going to convert document batch...
2025-11-14 17:20:54,629 - INFO - Processing document 4_2024-06-04
2025-11-14 17:20:55,336 - INFO - Finished converting document 4_2024-06-04 in 0.72 sec.
2025-11-14 17:20:55,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,374 - INFO - Going to convert document batch...
2025-11-14 17:20:55,375 - INFO - Processing document 4_2024-06-07
2025-11-14 17:20:55,392 - INFO - Finished converting document 4_2024-06-07 in 0.03 sec.
2025-11-14 17:20:55,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,431 - INFO - Going to convert document batch...
2025-11-14 17:20:55,431 - INFO - Processing document 4_2024-06-14
2025-11-14 17:20:55,450 - INFO - Finished converting document 4_2024-06-14 in 0.05 sec.
2025-11-14 17:20:55,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,512 - INFO - Going to convert document batch...
2025-11-14 17:20:55,513 - 

Converted 'data\edgar_documents\MSFT\4_2024-06-04' --> 'data\processed_data\MSFT\4_2024-06-04.md'
Converted 'data\edgar_documents\MSFT\4_2024-06-07' --> 'data\processed_data\MSFT\4_2024-06-07.md'
Converted 'data\edgar_documents\MSFT\4_2024-06-14' --> 'data\processed_data\MSFT\4_2024-06-14.md'
Converted 'data\edgar_documents\MSFT\4_2024-07-16' --> 'data\processed_data\MSFT\4_2024-07-16.md'


2025-11-14 17:20:55,567 - INFO - Going to convert document batch...
2025-11-14 17:20:55,568 - INFO - Processing document 4_2024-08-26
2025-11-14 17:20:55,591 - INFO - Finished converting document 4_2024-08-26 in 0.05 sec.
2025-11-14 17:20:55,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,635 - INFO - Going to convert document batch...
2025-11-14 17:20:55,637 - INFO - Processing document 4_2024-09-03
2025-11-14 17:20:55,657 - INFO - Finished converting document 4_2024-09-03 in 0.05 sec.
2025-11-14 17:20:55,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,697 - INFO - Going to convert document batch...
2025-11-14 17:20:55,698 - INFO - Processing document 4_2024-09-05
2025-11-14 17:20:55,725 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 17:20:55,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,771 - INFO - Going to convert document batch...
2025-11-14 17:20:55,772 - 

Converted 'data\edgar_documents\MSFT\4_2024-08-26' --> 'data\processed_data\MSFT\4_2024-08-26.md'
Converted 'data\edgar_documents\MSFT\4_2024-09-03' --> 'data\processed_data\MSFT\4_2024-09-03.md'
Converted 'data\edgar_documents\MSFT\4_2024-09-05' --> 'data\processed_data\MSFT\4_2024-09-05.md'


2025-11-14 17:20:55,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,828 - INFO - Going to convert document batch...
2025-11-14 17:20:55,828 - INFO - Processing document 4_2024-09-09
2025-11-14 17:20:55,847 - INFO - Finished converting document 4_2024-09-09 in 0.03 sec.
2025-11-14 17:20:55,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,889 - INFO - Going to convert document batch...
2025-11-14 17:20:55,889 - INFO - Processing document 4_2024-09-11
2025-11-14 17:20:55,906 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.
2025-11-14 17:20:55,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:55,946 - INFO - Going to convert document batch...
2025-11-14 17:20:55,946 - INFO - Processing document 4_2024-09-13
2025-11-14 17:20:55,966 - INFO - Finished converting document 4_2024-09-13 in 0.05 sec.
2025-11-14 17:20:55,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2024-09-06' --> 'data\processed_data\MSFT\4_2024-09-06.md'
Converted 'data\edgar_documents\MSFT\4_2024-09-09' --> 'data\processed_data\MSFT\4_2024-09-09.md'
Converted 'data\edgar_documents\MSFT\4_2024-09-11' --> 'data\processed_data\MSFT\4_2024-09-11.md'
Converted 'data\edgar_documents\MSFT\4_2024-09-13' --> 'data\processed_data\MSFT\4_2024-09-13.md'


2025-11-14 17:20:56,005 - INFO - Going to convert document batch...
2025-11-14 17:20:56,007 - INFO - Processing document 4_2024-09-18
2025-11-14 17:20:56,027 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 17:20:56,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,072 - INFO - Going to convert document batch...
2025-11-14 17:20:56,073 - INFO - Processing document 4_2024-11-12
2025-11-14 17:20:56,094 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:20:56,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,146 - INFO - Going to convert document batch...
2025-11-14 17:20:56,147 - INFO - Processing document 4_2024-11-14
2025-11-14 17:20:56,164 - INFO - Finished converting document 4_2024-11-14 in 0.03 sec.
2025-11-14 17:20:56,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,202 - INFO - Going to convert document batch...
2025-11-14 17:20:56,203 - 

Converted 'data\edgar_documents\MSFT\4_2024-09-18' --> 'data\processed_data\MSFT\4_2024-09-18.md'
Converted 'data\edgar_documents\MSFT\4_2024-11-12' --> 'data\processed_data\MSFT\4_2024-11-12.md'
Converted 'data\edgar_documents\MSFT\4_2024-11-14' --> 'data\processed_data\MSFT\4_2024-11-14.md'


2025-11-14 17:20:56,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,256 - INFO - Going to convert document batch...
2025-11-14 17:20:56,257 - INFO - Processing document 4_2024-12-02
2025-11-14 17:20:56,275 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 17:20:56,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,317 - INFO - Going to convert document batch...
2025-11-14 17:20:56,318 - INFO - Processing document 4_2024-12-05
2025-11-14 17:20:56,335 - INFO - Finished converting document 4_2024-12-05 in 0.03 sec.
2025-11-14 17:20:56,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,373 - INFO - Going to convert document batch...
2025-11-14 17:20:56,374 - INFO - Processing document 4_2024-12-10
2025-11-14 17:20:56,391 - INFO - Finished converting document 4_2024-12-10 in 0.03 sec.
2025-11-14 17:20:56,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2024-11-25' --> 'data\processed_data\MSFT\4_2024-11-25.md'
Converted 'data\edgar_documents\MSFT\4_2024-12-02' --> 'data\processed_data\MSFT\4_2024-12-02.md'
Converted 'data\edgar_documents\MSFT\4_2024-12-05' --> 'data\processed_data\MSFT\4_2024-12-05.md'
Converted 'data\edgar_documents\MSFT\4_2024-12-10' --> 'data\processed_data\MSFT\4_2024-12-10.md'


2025-11-14 17:20:56,428 - INFO - Going to convert document batch...
2025-11-14 17:20:56,428 - INFO - Processing document 4_2024-12-13
2025-11-14 17:20:56,447 - INFO - Finished converting document 4_2024-12-13 in 0.03 sec.
2025-11-14 17:20:56,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,507 - INFO - Going to convert document batch...
2025-11-14 17:20:56,510 - INFO - Processing document 4_2024-12-16
2025-11-14 17:20:56,539 - INFO - Finished converting document 4_2024-12-16 in 0.06 sec.
2025-11-14 17:20:56,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,577 - INFO - Going to convert document batch...
2025-11-14 17:20:56,577 - INFO - Processing document 4_2025-02-03
2025-11-14 17:20:56,597 - INFO - Finished converting document 4_2025-02-03 in 0.03 sec.
2025-11-14 17:20:56,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,639 - INFO - Going to convert document batch...
2025-11-14 17:20:56,640 - 

Converted 'data\edgar_documents\MSFT\4_2024-12-13' --> 'data\processed_data\MSFT\4_2024-12-13.md'
Converted 'data\edgar_documents\MSFT\4_2024-12-16' --> 'data\processed_data\MSFT\4_2024-12-16.md'
Converted 'data\edgar_documents\MSFT\4_2025-02-03' --> 'data\processed_data\MSFT\4_2025-02-03.md'


2025-11-14 17:20:56,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,713 - INFO - Going to convert document batch...
2025-11-14 17:20:56,714 - INFO - Processing document 4_2025-03-14
2025-11-14 17:20:56,735 - INFO - Finished converting document 4_2025-03-14 in 0.06 sec.
2025-11-14 17:20:56,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,778 - INFO - Going to convert document batch...
2025-11-14 17:20:56,779 - INFO - Processing document 4_2025-04-16
2025-11-14 17:20:56,798 - INFO - Finished converting document 4_2025-04-16 in 0.05 sec.
2025-11-14 17:20:56,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,840 - INFO - Going to convert document batch...
2025-11-14 17:20:56,840 - INFO - Processing document 4_2025-05-06
2025-11-14 17:20:56,859 - INFO - Finished converting document 4_2025-05-06 in 0.05 sec.


Converted 'data\edgar_documents\MSFT\4_2025-03-03' --> 'data\processed_data\MSFT\4_2025-03-03.md'
Converted 'data\edgar_documents\MSFT\4_2025-03-14' --> 'data\processed_data\MSFT\4_2025-03-14.md'
Converted 'data\edgar_documents\MSFT\4_2025-04-16' --> 'data\processed_data\MSFT\4_2025-04-16.md'


2025-11-14 17:20:56,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,910 - INFO - Going to convert document batch...
2025-11-14 17:20:56,911 - INFO - Processing document 4_2025-05-16
2025-11-14 17:20:56,933 - INFO - Finished converting document 4_2025-05-16 in 0.06 sec.
2025-11-14 17:20:56,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:56,983 - INFO - Going to convert document batch...
2025-11-14 17:20:56,984 - INFO - Processing document 4_2025-05-20
2025-11-14 17:20:57,004 - INFO - Finished converting document 4_2025-05-20 in 0.05 sec.
2025-11-14 17:20:57,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,044 - INFO - Going to convert document batch...
2025-11-14 17:20:57,045 - INFO - Processing document 4_2025-05-22
2025-11-14 17:20:57,065 - INFO - Finished converting document 4_2025-05-22 in 0.03 sec.


Converted 'data\edgar_documents\MSFT\4_2025-05-06' --> 'data\processed_data\MSFT\4_2025-05-06.md'
Converted 'data\edgar_documents\MSFT\4_2025-05-16' --> 'data\processed_data\MSFT\4_2025-05-16.md'
Converted 'data\edgar_documents\MSFT\4_2025-05-20' --> 'data\processed_data\MSFT\4_2025-05-20.md'


2025-11-14 17:20:57,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,134 - INFO - Going to convert document batch...
2025-11-14 17:20:57,136 - INFO - Processing document 4_2025-06-02
2025-11-14 17:20:57,159 - INFO - Finished converting document 4_2025-06-02 in 0.05 sec.
2025-11-14 17:20:57,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,205 - INFO - Going to convert document batch...
2025-11-14 17:20:57,206 - INFO - Processing document 4_2025-06-04
2025-11-14 17:20:57,244 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 17:20:57,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2025-05-22' --> 'data\processed_data\MSFT\4_2025-05-22.md'
Converted 'data\edgar_documents\MSFT\4_2025-06-02' --> 'data\processed_data\MSFT\4_2025-06-02.md'
Converted 'data\edgar_documents\MSFT\4_2025-06-04' --> 'data\processed_data\MSFT\4_2025-06-04.md'


2025-11-14 17:20:57,302 - INFO - Going to convert document batch...
2025-11-14 17:20:57,302 - INFO - Processing document 4_2025-06-11
2025-11-14 17:20:57,324 - INFO - Finished converting document 4_2025-06-11 in 0.05 sec.
2025-11-14 17:20:57,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,365 - INFO - Going to convert document batch...
2025-11-14 17:20:57,366 - INFO - Processing document 4_2025-06-13
2025-11-14 17:20:57,387 - INFO - Finished converting document 4_2025-06-13 in 0.05 sec.
2025-11-14 17:20:57,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,448 - INFO - Going to convert document batch...
2025-11-14 17:20:57,449 - INFO - Processing document 4_2025-06-16
2025-11-14 17:20:57,466 - INFO - Finished converting document 4_2025-06-16 in 0.06 sec.
2025-11-14 17:20:57,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,509 - INFO - Going to convert document batch...
2025-11-14 17:20:57,509 - 

Converted 'data\edgar_documents\MSFT\4_2025-06-11' --> 'data\processed_data\MSFT\4_2025-06-11.md'
Converted 'data\edgar_documents\MSFT\4_2025-06-13' --> 'data\processed_data\MSFT\4_2025-06-13.md'
Converted 'data\edgar_documents\MSFT\4_2025-06-16' --> 'data\processed_data\MSFT\4_2025-06-16.md'


2025-11-14 17:20:57,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,566 - INFO - Going to convert document batch...
2025-11-14 17:20:57,566 - INFO - Processing document 4_2025-08-11
2025-11-14 17:20:57,584 - INFO - Finished converting document 4_2025-08-11 in 0.03 sec.
2025-11-14 17:20:57,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,625 - INFO - Going to convert document batch...
2025-11-14 17:20:57,626 - INFO - Processing document 4_2025-08-13
2025-11-14 17:20:57,647 - INFO - Finished converting document 4_2025-08-13 in 0.03 sec.
2025-11-14 17:20:57,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,693 - INFO - Going to convert document batch...
2025-11-14 17:20:57,693 - INFO - Processing document 4_2025-08-18
2025-11-14 17:20:57,712 - INFO - Finished converting document 4_2025-08-18 in 0.03 sec.


Converted 'data\edgar_documents\MSFT\4_2025-07-16' --> 'data\processed_data\MSFT\4_2025-07-16.md'
Converted 'data\edgar_documents\MSFT\4_2025-08-11' --> 'data\processed_data\MSFT\4_2025-08-11.md'
Converted 'data\edgar_documents\MSFT\4_2025-08-13' --> 'data\processed_data\MSFT\4_2025-08-13.md'


2025-11-14 17:20:57,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,751 - INFO - Going to convert document batch...
2025-11-14 17:20:57,751 - INFO - Processing document 4_2025-09-03
2025-11-14 17:20:57,773 - INFO - Finished converting document 4_2025-09-03 in 0.03 sec.
2025-11-14 17:20:57,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,817 - INFO - Going to convert document batch...
2025-11-14 17:20:57,818 - INFO - Processing document 4_2025-09-04
2025-11-14 17:20:57,846 - INFO - Finished converting document 4_2025-09-04 in 0.05 sec.
2025-11-14 17:20:57,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,892 - INFO - Going to convert document batch...
2025-11-14 17:20:57,893 - INFO - Processing document 4_2025-09-12
2025-11-14 17:20:57,916 - INFO - Finished converting document 4_2025-09-12 in 0.03 sec.


Converted 'data\edgar_documents\MSFT\4_2025-08-18' --> 'data\processed_data\MSFT\4_2025-08-18.md'
Converted 'data\edgar_documents\MSFT\4_2025-09-03' --> 'data\processed_data\MSFT\4_2025-09-03.md'
Converted 'data\edgar_documents\MSFT\4_2025-09-04' --> 'data\processed_data\MSFT\4_2025-09-04.md'


2025-11-14 17:20:57,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:57,968 - INFO - Going to convert document batch...
2025-11-14 17:20:57,970 - INFO - Processing document 4_2025-09-15
2025-11-14 17:20:57,999 - INFO - Finished converting document 4_2025-09-15 in 0.06 sec.
2025-11-14 17:20:58,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,062 - INFO - Going to convert document batch...
2025-11-14 17:20:58,063 - INFO - Processing document 4_2025-09-17
2025-11-14 17:20:58,081 - INFO - Finished converting document 4_2025-09-17 in 0.06 sec.
2025-11-14 17:20:58,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,119 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\MSFT\4_2025-09-12' --> 'data\processed_data\MSFT\4_2025-09-12.md'
Converted 'data\edgar_documents\MSFT\4_2025-09-15' --> 'data\processed_data\MSFT\4_2025-09-15.md'
Converted 'data\edgar_documents\MSFT\4_2025-09-17' --> 'data\processed_data\MSFT\4_2025-09-17.md'


2025-11-14 17:20:58,120 - INFO - Processing document 4_2025-10-03
2025-11-14 17:20:58,139 - INFO - Finished converting document 4_2025-10-03 in 0.05 sec.
2025-11-14 17:20:58,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,181 - INFO - Going to convert document batch...
2025-11-14 17:20:58,182 - INFO - Processing document 4_2025-10-15
2025-11-14 17:20:58,199 - INFO - Finished converting document 4_2025-10-15 in 0.05 sec.
2025-11-14 17:20:58,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,259 - INFO - Going to convert document batch...
2025-11-14 17:20:58,260 - INFO - Processing document 4_2025-11-04
2025-11-14 17:20:58,279 - INFO - Finished converting document 4_2025-11-04 in 0.06 sec.
2025-11-14 17:20:58,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,336 - INFO - Going to convert document batch...
2025-11-14 17:20:58,337 - INFO - Processing document 4_2025-11-07
2025-11-14 17:20:58,353 - IN

Converted 'data\edgar_documents\MSFT\4_2025-10-03' --> 'data\processed_data\MSFT\4_2025-10-03.md'
Converted 'data\edgar_documents\MSFT\4_2025-10-15' --> 'data\processed_data\MSFT\4_2025-10-15.md'
Converted 'data\edgar_documents\MSFT\4_2025-11-04' --> 'data\processed_data\MSFT\4_2025-11-04.md'


2025-11-14 17:20:58,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,398 - INFO - Going to convert document batch...
2025-11-14 17:20:58,399 - INFO - Processing document 8-K_2023-01-18
2025-11-14 17:20:58,414 - INFO - Finished converting document 8-K_2023-01-18 in 0.03 sec.
2025-11-14 17:20:58,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,455 - INFO - Going to convert document batch...
2025-11-14 17:20:58,456 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:20:58,477 - INFO - Finished converting document 8-K_2023-01-24 in 0.05 sec.
2025-11-14 17:20:58,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,517 - INFO - Going to convert document batch...
2025-11-14 17:20:58,519 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:20:58,534 - INFO - Finished converting document 8-K_2023-04-25 in 0.05 sec.
2025-11-14 17:20:58,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\4_2025-11-07' --> 'data\processed_data\MSFT\4_2025-11-07.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-01-18' --> 'data\processed_data\MSFT\8-K_2023-01-18.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-01-24' --> 'data\processed_data\MSFT\8-K_2023-01-24.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-04-25' --> 'data\processed_data\MSFT\8-K_2023-04-25.md'


2025-11-14 17:20:58,568 - INFO - Going to convert document batch...
2025-11-14 17:20:58,569 - INFO - Processing document 8-K_2023-07-03
2025-11-14 17:20:58,588 - INFO - Finished converting document 8-K_2023-07-03 in 0.05 sec.
2025-11-14 17:20:58,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,629 - INFO - Going to convert document batch...
2025-11-14 17:20:58,630 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:20:58,650 - INFO - Finished converting document 8-K_2023-07-25 in 0.05 sec.
2025-11-14 17:20:58,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,682 - INFO - Going to convert document batch...
2025-11-14 17:20:58,682 - INFO - Processing document 8-K_2023-10-11
2025-11-14 17:20:58,696 - INFO - Finished converting document 8-K_2023-10-11 in 0.03 sec.
2025-11-14 17:20:58,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,726 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\MSFT\8-K_2023-07-03' --> 'data\processed_data\MSFT\8-K_2023-07-03.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-07-25' --> 'data\processed_data\MSFT\8-K_2023-07-25.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-10-11' --> 'data\processed_data\MSFT\8-K_2023-10-11.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-10-13' --> 'data\processed_data\MSFT\8-K_2023-10-13.md'


2025-11-14 17:20:58,795 - INFO - Finished converting document 8-K_2023-10-16 in 0.05 sec.
2025-11-14 17:20:58,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,847 - INFO - Going to convert document batch...
2025-11-14 17:20:58,848 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:20:58,867 - INFO - Finished converting document 8-K_2023-10-24 in 0.05 sec.
2025-11-14 17:20:58,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,900 - INFO - Going to convert document batch...
2025-11-14 17:20:58,902 - INFO - Processing document 8-K_2023-10-30
2025-11-14 17:20:58,920 - INFO - Finished converting document 8-K_2023-10-30 in 0.05 sec.
2025-11-14 17:20:58,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:58,961 - INFO - Going to convert document batch...
2025-11-14 17:20:58,962 - INFO - Processing document 8-K_2023-11-06
2025-11-14 17:20:59,001 - INFO - Finished converting document 8-K_2023-11-06 in 0.

Converted 'data\edgar_documents\MSFT\8-K_2023-10-16' --> 'data\processed_data\MSFT\8-K_2023-10-16.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-10-24' --> 'data\processed_data\MSFT\8-K_2023-10-24.md'
Converted 'data\edgar_documents\MSFT\8-K_2023-10-30' --> 'data\processed_data\MSFT\8-K_2023-10-30.md'


2025-11-14 17:20:59,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,088 - INFO - Going to convert document batch...
2025-11-14 17:20:59,088 - INFO - Processing document 8-K_2023-12-08


Converted 'data\edgar_documents\MSFT\8-K_2023-11-06' --> 'data\processed_data\MSFT\8-K_2023-11-06.md'


2025-11-14 17:20:59,393 - INFO - Finished converting document 8-K_2023-12-08 in 0.38 sec.
2025-11-14 17:20:59,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,482 - INFO - Going to convert document batch...
2025-11-14 17:20:59,484 - INFO - Processing document 8-K_2024-01-19
2025-11-14 17:20:59,519 - INFO - Finished converting document 8-K_2024-01-19 in 0.09 sec.
2025-11-14 17:20:59,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,587 - INFO - Going to convert document batch...
2025-11-14 17:20:59,588 - INFO - Processing document 8-K_2024-01-30
2025-11-14 17:20:59,608 - INFO - Finished converting document 8-K_2024-01-30 in 0.08 sec.


Converted 'data\edgar_documents\MSFT\8-K_2023-12-08' --> 'data\processed_data\MSFT\8-K_2023-12-08.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-01-19' --> 'data\processed_data\MSFT\8-K_2024-01-19.md'


2025-11-14 17:20:59,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,646 - INFO - Going to convert document batch...
2025-11-14 17:20:59,647 - INFO - Processing document 8-K_2024-03-08
2025-11-14 17:20:59,665 - INFO - Finished converting document 8-K_2024-03-08 in 0.03 sec.
2025-11-14 17:20:59,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,710 - INFO - Going to convert document batch...
2025-11-14 17:20:59,711 - INFO - Processing document 8-K_2024-04-25
2025-11-14 17:20:59,730 - INFO - Finished converting document 8-K_2024-04-25 in 0.06 sec.
2025-11-14 17:20:59,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,804 - INFO - Going to convert document batch...
2025-11-14 17:20:59,804 - INFO - Processing document 8-K_2024-07-30
2025-11-14 17:20:59,823 - INFO - Finished converting document 8-K_2024-07-30 in 0.09 sec.


Converted 'data\edgar_documents\MSFT\8-K_2024-01-30' --> 'data\processed_data\MSFT\8-K_2024-01-30.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-03-08' --> 'data\processed_data\MSFT\8-K_2024-03-08.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-04-25' --> 'data\processed_data\MSFT\8-K_2024-04-25.md'


2025-11-14 17:20:59,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,854 - INFO - Going to convert document batch...
2025-11-14 17:20:59,855 - INFO - Processing document 8-K_2024-08-21
2025-11-14 17:20:59,872 - INFO - Finished converting document 8-K_2024-08-21 in 0.05 sec.
2025-11-14 17:20:59,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:20:59,911 - INFO - Going to convert document batch...
2025-11-14 17:20:59,911 - INFO - Processing document 8-K_2024-10-30
2025-11-14 17:20:59,928 - INFO - Finished converting document 8-K_2024-10-30 in 0.05 sec.
2025-11-14 17:20:59,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\MSFT\8-K_2024-07-30' --> 'data\processed_data\MSFT\8-K_2024-07-30.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-08-21' --> 'data\processed_data\MSFT\8-K_2024-08-21.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-10-30' --> 'data\processed_data\MSFT\8-K_2024-10-30.md'


2025-11-14 17:21:00,044 - INFO - Going to convert document batch...
2025-11-14 17:21:00,045 - INFO - Processing document 8-K_2024-12-03
2025-11-14 17:21:00,149 - INFO - Finished converting document 8-K_2024-12-03 in 0.20 sec.
2025-11-14 17:21:00,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,247 - INFO - Going to convert document batch...
2025-11-14 17:21:00,249 - INFO - Processing document 8-K_2024-12-11
2025-11-14 17:21:00,309 - INFO - Finished converting document 8-K_2024-12-11 in 0.16 sec.


Converted 'data\edgar_documents\MSFT\8-K_2024-12-03' --> 'data\processed_data\MSFT\8-K_2024-12-03.md'
Converted 'data\edgar_documents\MSFT\8-K_2024-12-11' --> 'data\processed_data\MSFT\8-K_2024-12-11.md'


2025-11-14 17:21:00,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,380 - INFO - Going to convert document batch...
2025-11-14 17:21:00,381 - INFO - Processing document 8-K_2025-01-22
2025-11-14 17:21:00,396 - INFO - Finished converting document 8-K_2025-01-22 in 0.06 sec.
2025-11-14 17:21:00,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,456 - INFO - Going to convert document batch...
2025-11-14 17:21:00,457 - INFO - Processing document 8-K_2025-01-29
2025-11-14 17:21:00,483 - INFO - Finished converting document 8-K_2025-01-29 in 0.08 sec.
2025-11-14 17:21:00,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,529 - INFO - Going to convert document batch...
2025-11-14 17:21:00,530 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:21:00,548 - INFO - Finished converting document 8-K_2025-04-30 in 0.05 sec.
2025-11-14 17:21:00,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\MSFT\8-K_2025-01-22' --> 'data\processed_data\MSFT\8-K_2025-01-22.md'
Converted 'data\edgar_documents\MSFT\8-K_2025-01-29' --> 'data\processed_data\MSFT\8-K_2025-01-29.md'
Converted 'data\edgar_documents\MSFT\8-K_2025-04-30' --> 'data\processed_data\MSFT\8-K_2025-04-30.md'


2025-11-14 17:21:00,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,638 - INFO - Going to convert document batch...
2025-11-14 17:21:00,639 - INFO - Processing document 8-K_2025-07-30
2025-11-14 17:21:00,660 - INFO - Finished converting document 8-K_2025-07-30 in 0.05 sec.
2025-11-14 17:21:00,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,697 - INFO - Going to convert document batch...
2025-11-14 17:21:00,697 - INFO - Processing document 8-K_2025-09-30
2025-11-14 17:21:00,713 - INFO - Finished converting document 8-K_2025-09-30 in 0.03 sec.
2025-11-14 17:21:00,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:00,750 - INFO - Going to convert document batch...
2025-11-14 17:21:00,751 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:21:00,771 - INFO - Finished converting document 8-K_2025-10-29 in 0.05 sec.


Converted 'data\edgar_documents\MSFT\8-K_2025-07-01' --> 'data\processed_data\MSFT\8-K_2025-07-01.md'
Converted 'data\edgar_documents\MSFT\8-K_2025-07-30' --> 'data\processed_data\MSFT\8-K_2025-07-30.md'
Converted 'data\edgar_documents\MSFT\8-K_2025-09-30' --> 'data\processed_data\MSFT\8-K_2025-09-30.md'
Converted 'data\edgar_documents\MSFT\8-K_2025-10-29' --> 'data\processed_data\MSFT\8-K_2025-10-29.md'


2025-11-14 17:21:00,817 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:00,818 - ERROR - Input document DEF-14A_2023-10-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:00,820 - INFO - Going to convert document batch...
2025-11-14 17:21:00,864 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:00,865 - ERROR - Input document DEF-14A_2024-10-24 with format No

Error processing data\edgar_documents\MSFT\DEF-14A_2023-10-19: File format not allowed: data\edgar_documents\MSFT\DEF-14A_2023-10-19
Error processing data\edgar_documents\MSFT\DEF-14A_2024-10-24: File format not allowed: data\edgar_documents\MSFT\DEF-14A_2024-10-24
Error processing data\edgar_documents\MSFT\DEF-14A_2025-10-21: File format not allowed: data\edgar_documents\MSFT\DEF-14A_2025-10-21
Processed 127 new files. Errors: 5
Found 159 files to process in data\edgar_documents\NEE


2025-11-14 17:21:01,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:02,275 - INFO - Going to convert document batch...
2025-11-14 17:21:02,276 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:21:02,276 - INFO - Processing document 10-K_2023-02-17
2025-11-14 17:21:06,691 - INFO - Finished converting document 10-K_2023-02-17 in 5.77 sec.
2025-11-14 17:21:07,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-K_2023-02-17' --> 'data\processed_data\NEE\10-K_2023-02-17.md'


2025-11-14 17:21:09,128 - INFO - Going to convert document batch...
2025-11-14 17:21:09,128 - INFO - Processing document 10-K_2024-02-16
2025-11-14 17:21:13,234 - INFO - Finished converting document 10-K_2024-02-16 in 5.55 sec.
2025-11-14 17:21:14,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-K_2024-02-16' --> 'data\processed_data\NEE\10-K_2024-02-16.md'


2025-11-14 17:21:15,872 - INFO - Going to convert document batch...
2025-11-14 17:21:15,873 - INFO - Processing document 10-K_2025-02-14
2025-11-14 17:21:19,996 - INFO - Finished converting document 10-K_2025-02-14 in 5.80 sec.
2025-11-14 17:21:21,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-K_2025-02-14' --> 'data\processed_data\NEE\10-K_2025-02-14.md'


2025-11-14 17:21:22,153 - INFO - Going to convert document batch...
2025-11-14 17:21:22,154 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 17:21:23,485 - INFO - Finished converting document 10-Q_2023-04-26 in 2.50 sec.
2025-11-14 17:21:24,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2023-04-26' --> 'data\processed_data\NEE\10-Q_2023-04-26.md'


2025-11-14 17:21:25,298 - INFO - Going to convert document batch...
2025-11-14 17:21:25,300 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 17:21:26,807 - INFO - Finished converting document 10-Q_2023-07-26 in 2.75 sec.
2025-11-14 17:21:27,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2023-07-26' --> 'data\processed_data\NEE\10-Q_2023-07-26.md'


2025-11-14 17:21:28,614 - INFO - Going to convert document batch...
2025-11-14 17:21:28,615 - INFO - Processing document 10-Q_2023-11-07
2025-11-14 17:21:30,147 - INFO - Finished converting document 10-Q_2023-11-07 in 2.67 sec.
2025-11-14 17:21:30,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2023-11-07' --> 'data\processed_data\NEE\10-Q_2023-11-07.md'


2025-11-14 17:21:31,919 - INFO - Going to convert document batch...
2025-11-14 17:21:31,920 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 17:21:33,198 - INFO - Finished converting document 10-Q_2024-04-23 in 2.39 sec.
2025-11-14 17:21:33,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2024-04-23' --> 'data\processed_data\NEE\10-Q_2024-04-23.md'


2025-11-14 17:21:34,501 - INFO - Going to convert document batch...
2025-11-14 17:21:34,501 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 17:21:36,480 - INFO - Finished converting document 10-Q_2024-07-24 in 2.69 sec.
2025-11-14 17:21:37,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2024-07-24' --> 'data\processed_data\NEE\10-Q_2024-07-24.md'


2025-11-14 17:21:37,895 - INFO - Going to convert document batch...
2025-11-14 17:21:37,896 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 17:21:39,405 - INFO - Finished converting document 10-Q_2024-10-23 in 2.27 sec.
2025-11-14 17:21:40,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2024-10-23' --> 'data\processed_data\NEE\10-Q_2024-10-23.md'


2025-11-14 17:21:41,211 - INFO - Going to convert document batch...
2025-11-14 17:21:41,211 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 17:21:42,488 - INFO - Finished converting document 10-Q_2025-04-23 in 1.92 sec.
2025-11-14 17:21:43,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2025-04-23' --> 'data\processed_data\NEE\10-Q_2025-04-23.md'


2025-11-14 17:21:44,283 - INFO - Going to convert document batch...
2025-11-14 17:21:44,283 - INFO - Processing document 10-Q_2025-07-23
2025-11-14 17:21:45,787 - INFO - Finished converting document 10-Q_2025-07-23 in 2.69 sec.
2025-11-14 17:21:46,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\10-Q_2025-07-23' --> 'data\processed_data\NEE\10-Q_2025-07-23.md'


2025-11-14 17:21:47,628 - INFO - Going to convert document batch...
2025-11-14 17:21:47,629 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 17:21:49,516 - INFO - Finished converting document 10-Q_2025-10-28 in 2.66 sec.
2025-11-14 17:21:50,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,234 - INFO - Going to convert document batch...
2025-11-14 17:21:50,235 - INFO - Processing document 4_2023-01-05
2025-11-14 17:21:50,255 - INFO - Finished converting document 4_2023-01-05 in 0.05 sec.
2025-11-14 17:21:50,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,306 - INFO - Going to convert document batch...
2025-11-14 17:21:50,306 - INFO - Processing document 4_2023-02-06
2025-11-14 17:21:50,322 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 17:21:50,394 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\NEE\10-Q_2025-10-28' --> 'data\processed_data\NEE\10-Q_2025-10-28.md'
Converted 'data\edgar_documents\NEE\4_2023-01-05' --> 'data\processed_data\NEE\4_2023-01-05.md'
Converted 'data\edgar_documents\NEE\4_2023-02-06' --> 'data\processed_data\NEE\4_2023-02-06.md'


2025-11-14 17:21:50,395 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:50,397 - INFO - Going to convert document batch...
2025-11-14 17:21:50,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,417 - INFO - Going to convert document batch...
2025-11-14 17:21:50,418 - INFO - Processing document 4_2023-02-10
2025-11-14 17:21:50,439 - INFO - Finished converting document 4_2023-02-10 in 0.05 sec.
2025-11-14 17:21:50,473 - INFO - detec

Error processing data\edgar_documents\NEE\4_2023-02-07: File format not allowed: data\edgar_documents\NEE\4_2023-02-07
Converted 'data\edgar_documents\NEE\4_2023-02-10' --> 'data\processed_data\NEE\4_2023-02-10.md'
Converted 'data\edgar_documents\NEE\4_2023-02-17' --> 'data\processed_data\NEE\4_2023-02-17.md'


2025-11-14 17:21:50,597 - INFO - Finished converting document 4_2023-02-21 in 0.06 sec.
2025-11-14 17:21:50,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,647 - INFO - Going to convert document batch...
2025-11-14 17:21:50,647 - INFO - Processing document 4_2023-02-22
2025-11-14 17:21:50,664 - INFO - Finished converting document 4_2023-02-22 in 0.03 sec.
2025-11-14 17:21:50,712 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:50,714 - ERROR - Input document 4_2023-02-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\NEE\4_2023-02-21' --> 'data\processed_data\NEE\4_2023-02-21.md'
Converted 'data\edgar_documents\NEE\4_2023-02-22' --> 'data\processed_data\NEE\4_2023-02-22.md'
Error processing data\edgar_documents\NEE\4_2023-02-23: File format not allowed: data\edgar_documents\NEE\4_2023-02-23
Converted 'data\edgar_documents\NEE\4_2023-03-02' --> 'data\processed_data\NEE\4_2023-03-02.md'


2025-11-14 17:21:50,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,851 - INFO - Going to convert document batch...
2025-11-14 17:21:50,852 - INFO - Processing document 4_2023-03-16
2025-11-14 17:21:50,872 - INFO - Finished converting document 4_2023-03-16 in 0.05 sec.
2025-11-14 17:21:50,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:50,917 - INFO - Going to convert document batch...
2025-11-14 17:21:50,918 - INFO - Processing document 4_2023-04-04
2025-11-14 17:21:50,954 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 17:21:50,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,007 - INFO - Going to convert document batch...
2025-11-14 17:21:51,007 - INFO - Processing document 4_2023-05-17


Converted 'data\edgar_documents\NEE\4_2023-03-10' --> 'data\processed_data\NEE\4_2023-03-10.md'
Converted 'data\edgar_documents\NEE\4_2023-03-16' --> 'data\processed_data\NEE\4_2023-03-16.md'
Converted 'data\edgar_documents\NEE\4_2023-04-04' --> 'data\processed_data\NEE\4_2023-04-04.md'


2025-11-14 17:21:51,027 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 17:21:51,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,075 - INFO - Going to convert document batch...
2025-11-14 17:21:51,076 - INFO - Processing document 4_2023-05-19
2025-11-14 17:21:51,097 - INFO - Finished converting document 4_2023-05-19 in 0.05 sec.
2025-11-14 17:21:51,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,146 - INFO - Going to convert document batch...
2025-11-14 17:21:51,147 - INFO - Processing document 4_2023-06-14
2025-11-14 17:21:51,166 - INFO - Finished converting document 4_2023-06-14 in 0.03 sec.
2025-11-14 17:21:51,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,231 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NEE\4_2023-05-17' --> 'data\processed_data\NEE\4_2023-05-17.md'
Converted 'data\edgar_documents\NEE\4_2023-05-19' --> 'data\processed_data\NEE\4_2023-05-19.md'
Converted 'data\edgar_documents\NEE\4_2023-06-14' --> 'data\processed_data\NEE\4_2023-06-14.md'


2025-11-14 17:21:51,231 - INFO - Processing document 4_2023-06-15
2025-11-14 17:21:51,253 - INFO - Finished converting document 4_2023-06-15 in 0.06 sec.
2025-11-14 17:21:51,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,300 - INFO - Going to convert document batch...
2025-11-14 17:21:51,301 - INFO - Processing document 4_2023-06-16
2025-11-14 17:21:51,333 - INFO - Finished converting document 4_2023-06-16 in 0.05 sec.
2025-11-14 17:21:51,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,384 - INFO - Going to convert document batch...
2025-11-14 17:21:51,385 - INFO - Processing document 4_2023-07-06
2025-11-14 17:21:51,407 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 17:21:51,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,461 - INFO - Going to convert document batch...
2025-11-14 17:21:51,462 - INFO - Processing document 4_2023-07-24
2025-11-14 17:21:51,480 - IN

Converted 'data\edgar_documents\NEE\4_2023-06-15' --> 'data\processed_data\NEE\4_2023-06-15.md'
Converted 'data\edgar_documents\NEE\4_2023-06-16' --> 'data\processed_data\NEE\4_2023-06-16.md'
Converted 'data\edgar_documents\NEE\4_2023-07-06' --> 'data\processed_data\NEE\4_2023-07-06.md'


2025-11-14 17:21:51,520 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:51,521 - ERROR - Input document 4_2023-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:51,523 - INFO - Going to convert document batch...
2025-11-14 17:21:51,545 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:51,546 - ERROR - Input document 4_2023-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\NEE\4_2023-07-24' --> 'data\processed_data\NEE\4_2023-07-24.md'
Error processing data\edgar_documents\NEE\4_2023-08-07: File format not allowed: data\edgar_documents\NEE\4_2023-08-07
Error processing data\edgar_documents\NEE\4_2023-08-08: File format not allowed: data\edgar_documents\NEE\4_2023-08-08
Converted 'data\edgar_documents\NEE\4_2023-08-15' --> 'data\processed_data\NEE\4_2023-08-15.md'
Converted 'data\edgar_documents\NEE\4_2023-08-17' --> 'data\processed_data\NEE\4_2023-08-17.md'


2025-11-14 17:21:51,695 - INFO - Going to convert document batch...
2025-11-14 17:21:51,696 - INFO - Processing document 4_2023-09-18
2025-11-14 17:21:51,719 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 17:21:51,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,780 - INFO - Going to convert document batch...
2025-11-14 17:21:51,781 - INFO - Processing document 4_2023-10-04
2025-11-14 17:21:51,811 - INFO - Finished converting document 4_2023-10-04 in 0.08 sec.
2025-11-14 17:21:51,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:51,852 - INFO - Going to convert document batch...
2025-11-14 17:21:51,852 - INFO - Processing document 4_2023-10-10
2025-11-14 17:21:51,871 - INFO - Finished converting document 4_2023-10-10 in 0.05 sec.
2025-11-14 17:21:51,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\4_2023-09-18' --> 'data\processed_data\NEE\4_2023-09-18.md'
Converted 'data\edgar_documents\NEE\4_2023-10-04' --> 'data\processed_data\NEE\4_2023-10-04.md'
Converted 'data\edgar_documents\NEE\4_2023-10-10' --> 'data\processed_data\NEE\4_2023-10-10.md'


2025-11-14 17:21:51,937 - INFO - Going to convert document batch...
2025-11-14 17:21:51,938 - INFO - Processing document 4_2023-10-13
2025-11-14 17:21:51,957 - INFO - Finished converting document 4_2023-10-13 in 0.06 sec.
2025-11-14 17:21:51,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,000 - INFO - Going to convert document batch...
2025-11-14 17:21:52,000 - INFO - Processing document 4_2023-11-16
2025-11-14 17:21:52,021 - INFO - Finished converting document 4_2023-11-16 in 0.05 sec.
2025-11-14 17:21:52,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,059 - INFO - Going to convert document batch...
2025-11-14 17:21:52,060 - INFO - Processing document 4_2023-12-11
2025-11-14 17:21:52,077 - INFO - Finished converting document 4_2023-12-11 in 0.05 sec.
2025-11-14 17:21:52,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,117 - INFO - Going to convert document batch...
2025-11-14 17:21:52,118 - 

Converted 'data\edgar_documents\NEE\4_2023-10-13' --> 'data\processed_data\NEE\4_2023-10-13.md'
Converted 'data\edgar_documents\NEE\4_2023-11-16' --> 'data\processed_data\NEE\4_2023-11-16.md'
Converted 'data\edgar_documents\NEE\4_2023-12-11' --> 'data\processed_data\NEE\4_2023-12-11.md'


2025-11-14 17:21:52,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,182 - INFO - Going to convert document batch...
2025-11-14 17:21:52,183 - INFO - Processing document 4_2023-12-18
2025-11-14 17:21:52,206 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 17:21:52,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,255 - INFO - Going to convert document batch...
2025-11-14 17:21:52,257 - INFO - Processing document 4_2024-01-04
2025-11-14 17:21:52,282 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.


Converted 'data\edgar_documents\NEE\4_2023-12-15' --> 'data\processed_data\NEE\4_2023-12-15.md'
Converted 'data\edgar_documents\NEE\4_2023-12-18' --> 'data\processed_data\NEE\4_2023-12-18.md'
Converted 'data\edgar_documents\NEE\4_2024-01-04' --> 'data\processed_data\NEE\4_2024-01-04.md'


2025-11-14 17:21:52,374 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:52,375 - ERROR - Input document 4_2024-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:52,377 - INFO - Going to convert document batch...
2025-11-14 17:21:52,408 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:52,409 - ERROR - Input document 4_2024-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\NEE\4_2024-01-29: File format not allowed: data\edgar_documents\NEE\4_2024-01-29
Error processing data\edgar_documents\NEE\4_2024-01-30: File format not allowed: data\edgar_documents\NEE\4_2024-01-30
Converted 'data\edgar_documents\NEE\4_2024-02-07' --> 'data\processed_data\NEE\4_2024-02-07.md'
Converted 'data\edgar_documents\NEE\4_2024-02-16' --> 'data\processed_data\NEE\4_2024-02-16.md'


2025-11-14 17:21:52,607 - INFO - Going to convert document batch...
2025-11-14 17:21:52,608 - INFO - Processing document 4_2024-02-20
2025-11-14 17:21:52,647 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 17:21:52,699 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:52,700 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:52,702 - INFO - Going to convert document batch...
2025-11-14 17:21:52,727 - IN

Converted 'data\edgar_documents\NEE\4_2024-02-20' --> 'data\processed_data\NEE\4_2024-02-20.md'
Error processing data\edgar_documents\NEE\4_2024-02-27: File format not allowed: data\edgar_documents\NEE\4_2024-02-27
Error processing data\edgar_documents\NEE\4_2024-02-28: File format not allowed: data\edgar_documents\NEE\4_2024-02-28
Error processing data\edgar_documents\NEE\4_2024-03-04: File format not allowed: data\edgar_documents\NEE\4_2024-03-04
Error processing data\edgar_documents\NEE\4_2024-03-05: File format not allowed: data\edgar_documents\NEE\4_2024-03-05
Converted 'data\edgar_documents\NEE\4_2024-03-13' --> 'data\processed_data\NEE\4_2024-03-13.md'


2025-11-14 17:21:52,867 - INFO - Finished converting document 4_2024-03-18 in 0.03 sec.
2025-11-14 17:21:52,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,910 - INFO - Going to convert document batch...
2025-11-14 17:21:52,911 - INFO - Processing document 4_2024-04-05
2025-11-14 17:21:52,934 - INFO - Finished converting document 4_2024-04-05 in 0.05 sec.
2025-11-14 17:21:52,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:52,979 - INFO - Going to convert document batch...
2025-11-14 17:21:52,980 - INFO - Processing document 4_2024-05-07
2025-11-14 17:21:52,998 - INFO - Finished converting document 4_2024-05-07 in 0.05 sec.
2025-11-14 17:21:53,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,037 - INFO - Going to convert document batch...
2025-11-14 17:21:53,038 - INFO - Processing document 4_2024-05-08
2025-11-14 17:21:53,058 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.


Converted 'data\edgar_documents\NEE\4_2024-03-18' --> 'data\processed_data\NEE\4_2024-03-18.md'
Converted 'data\edgar_documents\NEE\4_2024-04-05' --> 'data\processed_data\NEE\4_2024-04-05.md'
Converted 'data\edgar_documents\NEE\4_2024-05-07' --> 'data\processed_data\NEE\4_2024-05-07.md'


2025-11-14 17:21:53,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,097 - INFO - Going to convert document batch...
2025-11-14 17:21:53,098 - INFO - Processing document 4_2024-05-16
2025-11-14 17:21:53,125 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 17:21:53,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,185 - INFO - Going to convert document batch...
2025-11-14 17:21:53,186 - INFO - Processing document 4_2024-06-04
2025-11-14 17:21:53,211 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 17:21:53,253 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:53,254 - ERROR - Input document 4_2024-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\NEE\4_2024-05-08' --> 'data\processed_data\NEE\4_2024-05-08.md'
Converted 'data\edgar_documents\NEE\4_2024-05-16' --> 'data\processed_data\NEE\4_2024-05-16.md'
Converted 'data\edgar_documents\NEE\4_2024-06-04' --> 'data\processed_data\NEE\4_2024-06-04.md'
Error processing data\edgar_documents\NEE\4_2024-06-05: File format not allowed: data\edgar_documents\NEE\4_2024-06-05


2025-11-14 17:21:53,278 - ERROR - Input document 4_2024-06-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:53,279 - INFO - Going to convert document batch...
2025-11-14 17:21:53,307 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:53,307 - ERROR - Input document 4_2024-06-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\NEE\4_2024-06-06: File format not allowed: data\edgar_documents\NEE\4_2024-06-06
Error processing data\edgar_documents\NEE\4_2024-06-17: File format not allowed: data\edgar_documents\NEE\4_2024-06-17
Converted 'data\edgar_documents\NEE\4_2024-06-20' --> 'data\processed_data\NEE\4_2024-06-20.md'
Converted 'data\edgar_documents\NEE\4_2024-07-01' --> 'data\processed_data\NEE\4_2024-07-01.md'


2025-11-14 17:21:53,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,521 - INFO - Going to convert document batch...
2025-11-14 17:21:53,522 - INFO - Processing document 4_2024-08-01
2025-11-14 17:21:53,544 - INFO - Finished converting document 4_2024-08-01 in 0.05 sec.
2025-11-14 17:21:53,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,602 - INFO - Going to convert document batch...
2025-11-14 17:21:53,603 - INFO - Processing document 4_2024-08-06
2025-11-14 17:21:53,621 - INFO - Finished converting document 4_2024-08-06 in 0.06 sec.
2025-11-14 17:21:53,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,661 - INFO - Going to convert document batch...
2025-11-14 17:21:53,662 - INFO - Processing document 4_2024-08-27
2025-11-14 17:21:53,684 - INFO - Finished converting document 4_2024-08-27 in 0.05 sec.


Converted 'data\edgar_documents\NEE\4_2024-07-23' --> 'data\processed_data\NEE\4_2024-07-23.md'
Converted 'data\edgar_documents\NEE\4_2024-08-01' --> 'data\processed_data\NEE\4_2024-08-01.md'
Converted 'data\edgar_documents\NEE\4_2024-08-06' --> 'data\processed_data\NEE\4_2024-08-06.md'


2025-11-14 17:21:53,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,727 - INFO - Going to convert document batch...
2025-11-14 17:21:53,728 - INFO - Processing document 4_2024-09-17
2025-11-14 17:21:53,752 - INFO - Finished converting document 4_2024-09-17 in 0.05 sec.
2025-11-14 17:21:53,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,797 - INFO - Going to convert document batch...
2025-11-14 17:21:53,797 - INFO - Processing document 4_2024-10-02
2025-11-14 17:21:53,819 - INFO - Finished converting document 4_2024-10-02 in 0.03 sec.
2025-11-14 17:21:53,865 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:53,866 - ERROR - Input document 4_2024-10-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\NEE\4_2024-08-27' --> 'data\processed_data\NEE\4_2024-08-27.md'
Converted 'data\edgar_documents\NEE\4_2024-09-17' --> 'data\processed_data\NEE\4_2024-09-17.md'
Converted 'data\edgar_documents\NEE\4_2024-10-02' --> 'data\processed_data\NEE\4_2024-10-02.md'
Error processing data\edgar_documents\NEE\4_2024-10-28: File format not allowed: data\edgar_documents\NEE\4_2024-10-28


2025-11-14 17:21:53,893 - ERROR - Input document 4_2024-10-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:53,896 - INFO - Going to convert document batch...
2025-11-14 17:21:53,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:53,915 - INFO - Going to convert document batch...
2025-11-14 17:21:53,915 - INFO - Processing document 4_2024-11-13
2025-11-14 17:21:53,936 - INFO - Finished converting document 4_2024-11-13 in 0.05 sec.
2025-11-14 17:21:53,972 - INFO - detec

Error processing data\edgar_documents\NEE\4_2024-10-29: File format not allowed: data\edgar_documents\NEE\4_2024-10-29
Converted 'data\edgar_documents\NEE\4_2024-11-13' --> 'data\processed_data\NEE\4_2024-11-13.md'
Converted 'data\edgar_documents\NEE\4_2024-11-18' --> 'data\processed_data\NEE\4_2024-11-18.md'
Converted 'data\edgar_documents\NEE\4_2024-12-05' --> 'data\processed_data\NEE\4_2024-12-05.md'


2025-11-14 17:21:54,094 - INFO - Going to convert document batch...
2025-11-14 17:21:54,095 - INFO - Processing document 4_2024-12-18
2025-11-14 17:21:54,113 - INFO - Finished converting document 4_2024-12-18 in 0.03 sec.
2025-11-14 17:21:54,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,157 - INFO - Going to convert document batch...
2025-11-14 17:21:54,158 - INFO - Processing document 4_2025-01-07
2025-11-14 17:21:54,177 - INFO - Finished converting document 4_2025-01-07 in 0.03 sec.
2025-11-14 17:21:54,220 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:54,221 - ERROR - Input document 4_2025-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\NEE\4_2024-12-18' --> 'data\processed_data\NEE\4_2024-12-18.md'
Converted 'data\edgar_documents\NEE\4_2025-01-07' --> 'data\processed_data\NEE\4_2025-01-07.md'
Error processing data\edgar_documents\NEE\4_2025-01-30: File format not allowed: data\edgar_documents\NEE\4_2025-01-30
Error processing data\edgar_documents\NEE\4_2025-01-31: File format not allowed: data\edgar_documents\NEE\4_2025-01-31
Error processing data\edgar_documents\NEE\4_2025-02-04: File format not allowed: data\edgar_documents\NEE\4_2025-02-04
Error processing data\edgar_documents\NEE\4_2025-02-05: File format not allowed: data\edgar_documents\NEE\4_2025-02-05


2025-11-14 17:21:54,323 - INFO - Processing document 4_2025-02-14
2025-11-14 17:21:54,341 - INFO - Finished converting document 4_2025-02-14 in 0.05 sec.
2025-11-14 17:21:54,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,398 - INFO - Going to convert document batch...
2025-11-14 17:21:54,399 - INFO - Processing document 4_2025-02-18
2025-11-14 17:21:54,444 - INFO - Finished converting document 4_2025-02-18 in 0.08 sec.
2025-11-14 17:21:54,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,519 - INFO - Going to convert document batch...
2025-11-14 17:21:54,521 - INFO - Processing document 4_2025-02-19
2025-11-14 17:21:54,547 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.


Converted 'data\edgar_documents\NEE\4_2025-02-14' --> 'data\processed_data\NEE\4_2025-02-14.md'
Converted 'data\edgar_documents\NEE\4_2025-02-18' --> 'data\processed_data\NEE\4_2025-02-18.md'


2025-11-14 17:21:54,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,596 - INFO - Going to convert document batch...
2025-11-14 17:21:54,596 - INFO - Processing document 4_2025-02-20
2025-11-14 17:21:54,615 - INFO - Finished converting document 4_2025-02-20 in 0.03 sec.
2025-11-14 17:21:54,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,654 - INFO - Going to convert document batch...
2025-11-14 17:21:54,655 - INFO - Processing document 4_2025-03-18
2025-11-14 17:21:54,681 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 17:21:54,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,741 - INFO - Going to convert document batch...
2025-11-14 17:21:54,741 - INFO - Processing document 4_2025-04-02
2025-11-14 17:21:54,761 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.


Converted 'data\edgar_documents\NEE\4_2025-02-19' --> 'data\processed_data\NEE\4_2025-02-19.md'
Converted 'data\edgar_documents\NEE\4_2025-02-20' --> 'data\processed_data\NEE\4_2025-02-20.md'
Converted 'data\edgar_documents\NEE\4_2025-03-18' --> 'data\processed_data\NEE\4_2025-03-18.md'


2025-11-14 17:21:54,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,804 - INFO - Going to convert document batch...
2025-11-14 17:21:54,805 - INFO - Processing document 4_2025-05-07
2025-11-14 17:21:54,827 - INFO - Finished converting document 4_2025-05-07 in 0.05 sec.
2025-11-14 17:21:54,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:54,879 - INFO - Going to convert document batch...
2025-11-14 17:21:54,879 - INFO - Processing document 4_2025-05-12
2025-11-14 17:21:54,901 - INFO - Finished converting document 4_2025-05-12 in 0.06 sec.
2025-11-14 17:21:54,945 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:54,945 - ERROR - Input document 4_2025-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\NEE\4_2025-04-02' --> 'data\processed_data\NEE\4_2025-04-02.md'
Converted 'data\edgar_documents\NEE\4_2025-05-07' --> 'data\processed_data\NEE\4_2025-05-07.md'
Converted 'data\edgar_documents\NEE\4_2025-05-12' --> 'data\processed_data\NEE\4_2025-05-12.md'
Error processing data\edgar_documents\NEE\4_2025-05-14: File format not allowed: data\edgar_documents\NEE\4_2025-05-14


2025-11-14 17:21:54,967 - INFO - Processing document 4_2025-05-16
2025-11-14 17:21:54,985 - INFO - Finished converting document 4_2025-05-16 in 0.05 sec.
2025-11-14 17:21:55,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,028 - INFO - Going to convert document batch...
2025-11-14 17:21:55,029 - INFO - Processing document 4_2025-05-19
2025-11-14 17:21:55,047 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 17:21:55,087 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:55,088 - ERROR - Input document 4_2025-06-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\NEE\4_2025-05-16' --> 'data\processed_data\NEE\4_2025-05-16.md'
Converted 'data\edgar_documents\NEE\4_2025-05-19' --> 'data\processed_data\NEE\4_2025-05-19.md'
Error processing data\edgar_documents\NEE\4_2025-06-09: File format not allowed: data\edgar_documents\NEE\4_2025-06-09
Error processing data\edgar_documents\NEE\4_2025-06-11: File format not allowed: data\edgar_documents\NEE\4_2025-06-11
Converted 'data\edgar_documents\NEE\4_2025-06-18' --> 'data\processed_data\NEE\4_2025-06-18.md'


2025-11-14 17:21:55,194 - INFO - Going to convert document batch...
2025-11-14 17:21:55,194 - INFO - Processing document 4_2025-07-02
2025-11-14 17:21:55,215 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:21:55,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,258 - INFO - Going to convert document batch...
2025-11-14 17:21:55,258 - INFO - Processing document 4_2025-07-23
2025-11-14 17:21:55,281 - INFO - Finished converting document 4_2025-07-23 in 0.05 sec.
2025-11-14 17:21:55,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,320 - INFO - Going to convert document batch...
2025-11-14 17:21:55,321 - INFO - Processing document 4_2025-07-29
2025-11-14 17:21:55,339 - INFO - Finished converting document 4_2025-07-29 in 0.05 sec.
2025-11-14 17:21:55,411 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:55,412 - ERROR - Input document 4_2025-07-30 with format None does 

Converted 'data\edgar_documents\NEE\4_2025-07-02' --> 'data\processed_data\NEE\4_2025-07-02.md'
Converted 'data\edgar_documents\NEE\4_2025-07-23' --> 'data\processed_data\NEE\4_2025-07-23.md'
Converted 'data\edgar_documents\NEE\4_2025-07-29' --> 'data\processed_data\NEE\4_2025-07-29.md'
Error processing data\edgar_documents\NEE\4_2025-07-30: File format not allowed: data\edgar_documents\NEE\4_2025-07-30


2025-11-14 17:21:55,436 - INFO - Going to convert document batch...
2025-11-14 17:21:55,437 - INFO - Processing document 4_2025-09-09
2025-11-14 17:21:55,455 - INFO - Finished converting document 4_2025-09-09 in 0.05 sec.
2025-11-14 17:21:55,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,499 - INFO - Going to convert document batch...
2025-11-14 17:21:55,499 - INFO - Processing document 4_2025-09-15
2025-11-14 17:21:55,517 - INFO - Finished converting document 4_2025-09-15 in 0.05 sec.
2025-11-14 17:21:55,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,556 - INFO - Going to convert document batch...
2025-11-14 17:21:55,557 - INFO - Processing document 4_2025-09-16
2025-11-14 17:21:55,577 - INFO - Finished converting document 4_2025-09-16 in 0.05 sec.
2025-11-14 17:21:55,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,617 - INFO - Going to convert document batch...
2025-11-14 17:21:55,618 - 

Converted 'data\edgar_documents\NEE\4_2025-09-09' --> 'data\processed_data\NEE\4_2025-09-09.md'
Converted 'data\edgar_documents\NEE\4_2025-09-15' --> 'data\processed_data\NEE\4_2025-09-15.md'
Converted 'data\edgar_documents\NEE\4_2025-09-16' --> 'data\processed_data\NEE\4_2025-09-16.md'
Converted 'data\edgar_documents\NEE\4_2025-09-26' --> 'data\processed_data\NEE\4_2025-09-26.md'


2025-11-14 17:21:55,673 - INFO - Going to convert document batch...
2025-11-14 17:21:55,674 - INFO - Processing document 4_2025-10-02
2025-11-14 17:21:55,693 - INFO - Finished converting document 4_2025-10-02 in 0.03 sec.
2025-11-14 17:21:55,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:55,739 - INFO - Going to convert document batch...
2025-11-14 17:21:55,739 - INFO - Processing document 4_2025-10-06
2025-11-14 17:21:55,763 - INFO - Finished converting document 4_2025-10-06 in 0.05 sec.
2025-11-14 17:21:55,809 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:55,810 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\NEE\4_2025-10-02' --> 'data\processed_data\NEE\4_2025-10-02.md'
Converted 'data\edgar_documents\NEE\4_2025-10-06' --> 'data\processed_data\NEE\4_2025-10-06.md'
Error processing data\edgar_documents\NEE\4_2025-11-03: File format not allowed: data\edgar_documents\NEE\4_2025-11-03
Error processing data\edgar_documents\NEE\4_2025-11-07: File format not allowed: data\edgar_documents\NEE\4_2025-11-07
Converted 'data\edgar_documents\NEE\8-K_2023-01-25' --> 'data\processed_data\NEE\8-K_2023-01-25.md'


2025-11-14 17:21:55,928 - INFO - Going to convert document batch...
2025-11-14 17:21:55,928 - INFO - Processing document 8-K_2023-02-09
2025-11-14 17:21:55,951 - INFO - Finished converting document 8-K_2023-02-09 in 0.06 sec.
2025-11-14 17:21:56,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,017 - INFO - Going to convert document batch...
2025-11-14 17:21:56,018 - INFO - Processing document 8-K_2023-03-01
2025-11-14 17:21:56,039 - INFO - Finished converting document 8-K_2023-03-01 in 0.06 sec.
2025-11-14 17:21:56,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,081 - INFO - Going to convert document batch...
2025-11-14 17:21:56,082 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:21:56,109 - INFO - Finished converting document 8-K_2023-03-03 in 0.06 sec.
2025-11-14 17:21:56,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\8-K_2023-02-09' --> 'data\processed_data\NEE\8-K_2023-02-09.md'
Converted 'data\edgar_documents\NEE\8-K_2023-03-01' --> 'data\processed_data\NEE\8-K_2023-03-01.md'
Converted 'data\edgar_documents\NEE\8-K_2023-03-03' --> 'data\processed_data\NEE\8-K_2023-03-03.md'


2025-11-14 17:21:56,177 - INFO - Going to convert document batch...
2025-11-14 17:21:56,178 - INFO - Processing document 8-K_2023-03-17
2025-11-14 17:21:56,194 - INFO - Finished converting document 8-K_2023-03-17 in 0.06 sec.
2025-11-14 17:21:56,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,251 - INFO - Going to convert document batch...
2025-11-14 17:21:56,252 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:21:56,278 - INFO - Finished converting document 8-K_2023-04-25 in 0.08 sec.
2025-11-14 17:21:56,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,324 - INFO - Going to convert document batch...
2025-11-14 17:21:56,325 - INFO - Processing document 8-K_2023-05-18
2025-11-14 17:21:56,351 - INFO - Finished converting document 8-K_2023-05-18 in 0.05 sec.
2025-11-14 17:21:56,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,406 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NEE\8-K_2023-03-17' --> 'data\processed_data\NEE\8-K_2023-03-17.md'
Converted 'data\edgar_documents\NEE\8-K_2023-04-25' --> 'data\processed_data\NEE\8-K_2023-04-25.md'
Converted 'data\edgar_documents\NEE\8-K_2023-05-18' --> 'data\processed_data\NEE\8-K_2023-05-18.md'


2025-11-14 17:21:56,407 - INFO - Processing document 8-K_2023-05-22
2025-11-14 17:21:56,467 - INFO - Finished converting document 8-K_2023-05-22 in 0.11 sec.
2025-11-14 17:21:56,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,535 - INFO - Going to convert document batch...
2025-11-14 17:21:56,536 - INFO - Processing document 8-K_2023-06-20
2025-11-14 17:21:56,563 - INFO - Finished converting document 8-K_2023-06-20 in 0.06 sec.
2025-11-14 17:21:56,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,607 - INFO - Going to convert document batch...
2025-11-14 17:21:56,608 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:21:56,632 - INFO - Finished converting document 8-K_2023-07-25 in 0.05 sec.
2025-11-14 17:21:56,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:56,672 - INFO - Going to convert document batch...
2025-11-14 17:21:56,673 - INFO - Processing document 8-K_2023-08-10


Converted 'data\edgar_documents\NEE\8-K_2023-05-22' --> 'data\processed_data\NEE\8-K_2023-05-22.md'
Converted 'data\edgar_documents\NEE\8-K_2023-06-20' --> 'data\processed_data\NEE\8-K_2023-06-20.md'
Converted 'data\edgar_documents\NEE\8-K_2023-07-25' --> 'data\processed_data\NEE\8-K_2023-07-25.md'


2025-11-14 17:21:57,231 - INFO - Finished converting document 8-K_2023-08-10 in 0.59 sec.
2025-11-14 17:21:57,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,271 - INFO - Going to convert document batch...
2025-11-14 17:21:57,272 - INFO - Processing document 8-K_2023-09-25
2025-11-14 17:21:57,290 - INFO - Finished converting document 8-K_2023-09-25 in 0.03 sec.
2025-11-14 17:21:57,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,328 - INFO - Going to convert document batch...
2025-11-14 17:21:57,329 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:21:57,354 - INFO - Finished converting document 8-K_2023-10-24 in 0.06 sec.
2025-11-14 17:21:57,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,390 - INFO - Going to convert document batch...
2025-11-14 17:21:57,391 - INFO - Processing document 8-K_2023-11-16
2025-11-14 17:21:57,410 - INFO - Finished converting document 8-K_2023-11-16 in 0.

Converted 'data\edgar_documents\NEE\8-K_2023-08-10' --> 'data\processed_data\NEE\8-K_2023-08-10.md'
Converted 'data\edgar_documents\NEE\8-K_2023-09-25' --> 'data\processed_data\NEE\8-K_2023-09-25.md'
Converted 'data\edgar_documents\NEE\8-K_2023-10-24' --> 'data\processed_data\NEE\8-K_2023-10-24.md'
Converted 'data\edgar_documents\NEE\8-K_2023-11-16' --> 'data\processed_data\NEE\8-K_2023-11-16.md'


2025-11-14 17:21:57,447 - INFO - Going to convert document batch...
2025-11-14 17:21:57,448 - INFO - Processing document 8-K_2024-01-25
2025-11-14 17:21:57,474 - INFO - Finished converting document 8-K_2024-01-25 in 0.05 sec.
2025-11-14 17:21:57,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,540 - INFO - Going to convert document batch...
2025-11-14 17:21:57,541 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:21:57,565 - INFO - Finished converting document 8-K_2024-01-31 in 0.08 sec.
2025-11-14 17:21:57,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,598 - INFO - Going to convert document batch...
2025-11-14 17:21:57,600 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:21:57,618 - INFO - Finished converting document 8-K_2024-02-28 in 0.03 sec.
2025-11-14 17:21:57,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,650 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NEE\8-K_2024-01-25' --> 'data\processed_data\NEE\8-K_2024-01-25.md'
Converted 'data\edgar_documents\NEE\8-K_2024-01-31' --> 'data\processed_data\NEE\8-K_2024-01-31.md'
Converted 'data\edgar_documents\NEE\8-K_2024-02-28' --> 'data\processed_data\NEE\8-K_2024-02-28.md'


2025-11-14 17:21:57,672 - INFO - Finished converting document 8-K_2024-03-01 in 0.05 sec.
2025-11-14 17:21:57,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,708 - INFO - Going to convert document batch...
2025-11-14 17:21:57,709 - INFO - Processing document 8-K_2024-03-04
2025-11-14 17:21:57,734 - INFO - Finished converting document 8-K_2024-03-04 in 0.05 sec.
2025-11-14 17:21:57,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,770 - INFO - Going to convert document batch...
2025-11-14 17:21:57,771 - INFO - Processing document 8-K_2024-03-07
2025-11-14 17:21:57,789 - INFO - Finished converting document 8-K_2024-03-07 in 0.03 sec.
2025-11-14 17:21:57,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,826 - INFO - Going to convert document batch...
2025-11-14 17:21:57,827 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:21:57,852 - INFO - Finished converting document 8-K_2024-04-23 in 0.

Converted 'data\edgar_documents\NEE\8-K_2024-03-01' --> 'data\processed_data\NEE\8-K_2024-03-01.md'
Converted 'data\edgar_documents\NEE\8-K_2024-03-04' --> 'data\processed_data\NEE\8-K_2024-03-04.md'
Converted 'data\edgar_documents\NEE\8-K_2024-03-07' --> 'data\processed_data\NEE\8-K_2024-03-07.md'
Converted 'data\edgar_documents\NEE\8-K_2024-04-23' --> 'data\processed_data\NEE\8-K_2024-04-23.md'


2025-11-14 17:21:57,890 - INFO - Going to convert document batch...
2025-11-14 17:21:57,892 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:21:57,913 - INFO - Finished converting document 8-K_2024-05-06 in 0.05 sec.
2025-11-14 17:21:57,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:57,960 - INFO - Going to convert document batch...
2025-11-14 17:21:57,961 - INFO - Processing document 8-K_2024-05-28
2025-11-14 17:21:58,035 - INFO - Finished converting document 8-K_2024-05-28 in 0.11 sec.
2025-11-14 17:21:58,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,084 - INFO - Going to convert document batch...
2025-11-14 17:21:58,084 - INFO - Processing document 8-K_2024-06-03
2025-11-14 17:21:58,109 - INFO - Finished converting document 8-K_2024-06-03 in 0.05 sec.


Converted 'data\edgar_documents\NEE\8-K_2024-05-06' --> 'data\processed_data\NEE\8-K_2024-05-06.md'
Converted 'data\edgar_documents\NEE\8-K_2024-05-28' --> 'data\processed_data\NEE\8-K_2024-05-28.md'


2025-11-14 17:21:58,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,146 - INFO - Going to convert document batch...
2025-11-14 17:21:58,147 - INFO - Processing document 8-K_2024-06-07
2025-11-14 17:21:58,169 - INFO - Finished converting document 8-K_2024-06-07 in 0.05 sec.
2025-11-14 17:21:58,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,205 - INFO - Going to convert document batch...
2025-11-14 17:21:58,206 - INFO - Processing document 8-K_2024-06-11
2025-11-14 17:21:58,224 - INFO - Finished converting document 8-K_2024-06-11 in 0.03 sec.
2025-11-14 17:21:58,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,259 - INFO - Going to convert document batch...
2025-11-14 17:21:58,261 - INFO - Processing document 8-K_2024-06-20
2025-11-14 17:21:58,282 - INFO - Finished converting document 8-K_2024-06-20 in 0.05 sec.
2025-11-14 17:21:58,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NEE\8-K_2024-06-03' --> 'data\processed_data\NEE\8-K_2024-06-03.md'
Converted 'data\edgar_documents\NEE\8-K_2024-06-07' --> 'data\processed_data\NEE\8-K_2024-06-07.md'
Converted 'data\edgar_documents\NEE\8-K_2024-06-11' --> 'data\processed_data\NEE\8-K_2024-06-11.md'
Converted 'data\edgar_documents\NEE\8-K_2024-06-20' --> 'data\processed_data\NEE\8-K_2024-06-20.md'


2025-11-14 17:21:58,318 - INFO - Going to convert document batch...
2025-11-14 17:21:58,319 - INFO - Processing document 8-K_2024-07-01
2025-11-14 17:21:58,348 - INFO - Finished converting document 8-K_2024-07-01 in 0.05 sec.
2025-11-14 17:21:58,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,410 - INFO - Going to convert document batch...
2025-11-14 17:21:58,411 - INFO - Processing document 8-K_2024-07-10
2025-11-14 17:21:58,426 - INFO - Finished converting document 8-K_2024-07-10 in 0.05 sec.
2025-11-14 17:21:58,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,460 - INFO - Going to convert document batch...
2025-11-14 17:21:58,461 - INFO - Processing document 8-K_2024-07-24
2025-11-14 17:21:58,486 - INFO - Finished converting document 8-K_2024-07-24 in 0.05 sec.
2025-11-14 17:21:58,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,527 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NEE\8-K_2024-07-01' --> 'data\processed_data\NEE\8-K_2024-07-01.md'
Converted 'data\edgar_documents\NEE\8-K_2024-07-10' --> 'data\processed_data\NEE\8-K_2024-07-10.md'
Converted 'data\edgar_documents\NEE\8-K_2024-07-24' --> 'data\processed_data\NEE\8-K_2024-07-24.md'
Converted 'data\edgar_documents\NEE\8-K_2024-07-30' --> 'data\processed_data\NEE\8-K_2024-07-30.md'


2025-11-14 17:21:58,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,617 - INFO - Going to convert document batch...
2025-11-14 17:21:58,618 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:21:58,643 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.
2025-11-14 17:21:58,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,683 - INFO - Going to convert document batch...
2025-11-14 17:21:58,684 - INFO - Processing document 8-K_2024-10-31
2025-11-14 17:21:58,705 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 17:21:58,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,743 - INFO - Going to convert document batch...
2025-11-14 17:21:58,744 - INFO - Processing document 8-K_2024-12-30
2025-11-14 17:21:58,772 - INFO - Finished converting document 8-K_2024-12-30 in 0.05 sec.
2025-11-14 17:21:58,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\NEE\8-K_2024-10-23' --> 'data\processed_data\NEE\8-K_2024-10-23.md'
Converted 'data\edgar_documents\NEE\8-K_2024-10-31' --> 'data\processed_data\NEE\8-K_2024-10-31.md'
Converted 'data\edgar_documents\NEE\8-K_2024-12-30' --> 'data\processed_data\NEE\8-K_2024-12-30.md'


2025-11-14 17:21:58,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,877 - INFO - Going to convert document batch...
2025-11-14 17:21:58,878 - INFO - Processing document 8-K_2025-02-04
2025-11-14 17:21:58,901 - INFO - Finished converting document 8-K_2025-02-04 in 0.05 sec.
2025-11-14 17:21:58,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:58,938 - INFO - Going to convert document batch...
2025-11-14 17:21:58,942 - INFO - Processing document 8-K_2025-02-06
2025-11-14 17:21:58,984 - INFO - Finished converting document 8-K_2025-02-06 in 0.08 sec.
2025-11-14 17:21:59,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,024 - INFO - Going to convert document batch...
2025-11-14 17:21:59,025 - INFO - Processing document 8-K_2025-02-21
2025-11-14 17:21:59,053 - INFO - Finished converting document 8-K_2025-02-21 in 0.05 sec.


Converted 'data\edgar_documents\NEE\8-K_2025-01-24' --> 'data\processed_data\NEE\8-K_2025-01-24.md'
Converted 'data\edgar_documents\NEE\8-K_2025-02-04' --> 'data\processed_data\NEE\8-K_2025-02-04.md'
Converted 'data\edgar_documents\NEE\8-K_2025-02-06' --> 'data\processed_data\NEE\8-K_2025-02-06.md'


2025-11-14 17:21:59,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,094 - INFO - Going to convert document batch...
2025-11-14 17:21:59,095 - INFO - Processing document 8-K_2025-02-28
2025-11-14 17:21:59,119 - INFO - Finished converting document 8-K_2025-02-28 in 0.05 sec.
2025-11-14 17:21:59,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,180 - INFO - Going to convert document batch...
2025-11-14 17:21:59,180 - INFO - Processing document 8-K_2025-03-17
2025-11-14 17:21:59,204 - INFO - Finished converting document 8-K_2025-03-17 in 0.06 sec.
2025-11-14 17:21:59,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,242 - INFO - Going to convert document batch...
2025-11-14 17:21:59,244 - INFO - Processing document 8-K_2025-04-23


Converted 'data\edgar_documents\NEE\8-K_2025-02-21' --> 'data\processed_data\NEE\8-K_2025-02-21.md'
Converted 'data\edgar_documents\NEE\8-K_2025-02-28' --> 'data\processed_data\NEE\8-K_2025-02-28.md'
Converted 'data\edgar_documents\NEE\8-K_2025-03-17' --> 'data\processed_data\NEE\8-K_2025-03-17.md'


2025-11-14 17:21:59,283 - INFO - Finished converting document 8-K_2025-04-23 in 0.06 sec.
2025-11-14 17:21:59,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,333 - INFO - Going to convert document batch...
2025-11-14 17:21:59,334 - INFO - Processing document 8-K_2025-05-15
2025-11-14 17:21:59,355 - INFO - Finished converting document 8-K_2025-05-15 in 0.06 sec.
2025-11-14 17:21:59,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,418 - INFO - Going to convert document batch...
2025-11-14 17:21:59,419 - INFO - Processing document 8-K_2025-05-28
2025-11-14 17:21:59,455 - INFO - Finished converting document 8-K_2025-05-28 in 0.09 sec.


Converted 'data\edgar_documents\NEE\8-K_2025-04-23' --> 'data\processed_data\NEE\8-K_2025-04-23.md'
Converted 'data\edgar_documents\NEE\8-K_2025-05-15' --> 'data\processed_data\NEE\8-K_2025-05-15.md'
Converted 'data\edgar_documents\NEE\8-K_2025-05-28' --> 'data\processed_data\NEE\8-K_2025-05-28.md'


2025-11-14 17:21:59,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,520 - INFO - Going to convert document batch...
2025-11-14 17:21:59,521 - INFO - Processing document 8-K_2025-06-12
2025-11-14 17:21:59,545 - INFO - Finished converting document 8-K_2025-06-12 in 0.08 sec.
2025-11-14 17:21:59,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,588 - INFO - Going to convert document batch...
2025-11-14 17:21:59,589 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:21:59,613 - INFO - Finished converting document 8-K_2025-07-23 in 0.05 sec.
2025-11-14 17:21:59,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,652 - INFO - Going to convert document batch...
2025-11-14 17:21:59,652 - INFO - Processing document 8-K_2025-08-01
2025-11-14 17:21:59,676 - INFO - Finished converting document 8-K_2025-08-01 in 0.05 sec.
2025-11-14 17:21:59,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\NEE\8-K_2025-06-12' --> 'data\processed_data\NEE\8-K_2025-06-12.md'
Converted 'data\edgar_documents\NEE\8-K_2025-07-23' --> 'data\processed_data\NEE\8-K_2025-07-23.md'
Converted 'data\edgar_documents\NEE\8-K_2025-08-01' --> 'data\processed_data\NEE\8-K_2025-08-01.md'


2025-11-14 17:21:59,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:21:59,791 - INFO - Going to convert document batch...
2025-11-14 17:21:59,792 - INFO - Processing document 8-K_2025-10-28
2025-11-14 17:21:59,821 - INFO - Finished converting document 8-K_2025-10-28 in 0.05 sec.


Converted 'data\edgar_documents\NEE\8-K_2025-08-20' --> 'data\processed_data\NEE\8-K_2025-08-20.md'
Converted 'data\edgar_documents\NEE\8-K_2025-10-28' --> 'data\processed_data\NEE\8-K_2025-10-28.md'


2025-11-14 17:21:59,993 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:21:59,994 - ERROR - Input document DEF-14A_2023-04-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:21:59,997 - INFO - Going to convert document batch...
2025-11-14 17:22:00,082 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:22:00,083 - ERROR - Input document DEF-14A_2024-04-01 with format No

Error processing data\edgar_documents\NEE\DEF-14A_2023-04-05: File format not allowed: data\edgar_documents\NEE\DEF-14A_2023-04-05
Error processing data\edgar_documents\NEE\DEF-14A_2024-04-01: File format not allowed: data\edgar_documents\NEE\DEF-14A_2024-04-01
Error processing data\edgar_documents\NEE\DEF-14A_2025-04-01: File format not allowed: data\edgar_documents\NEE\DEF-14A_2025-04-01
Processed 131 new files. Errors: 28
Found 157 files to process in data\edgar_documents\NFLX


2025-11-14 17:22:00,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:00,765 - INFO - Going to convert document batch...
2025-11-14 17:22:00,767 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:22:00,767 - INFO - Processing document 10-K_2023-01-26
2025-11-14 17:22:01,620 - INFO - Finished converting document 10-K_2023-01-26 in 1.45 sec.
2025-11-14 17:22:02,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-K_2023-01-26' --> 'data\processed_data\NFLX\10-K_2023-01-26.md'


2025-11-14 17:22:02,421 - INFO - Going to convert document batch...
2025-11-14 17:22:02,421 - INFO - Processing document 10-K_2024-01-26
2025-11-14 17:22:03,580 - INFO - Finished converting document 10-K_2024-01-26 in 1.59 sec.
2025-11-14 17:22:04,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-K_2024-01-26' --> 'data\processed_data\NFLX\10-K_2024-01-26.md'


2025-11-14 17:22:04,509 - INFO - Going to convert document batch...
2025-11-14 17:22:04,510 - INFO - Processing document 10-K_2025-01-27
2025-11-14 17:22:05,534 - INFO - Finished converting document 10-K_2025-01-27 in 1.48 sec.
2025-11-14 17:22:06,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-K_2025-01-27' --> 'data\processed_data\NFLX\10-K_2025-01-27.md'


2025-11-14 17:22:06,352 - INFO - Going to convert document batch...
2025-11-14 17:22:06,353 - INFO - Processing document 10-Q_2023-04-21
2025-11-14 17:22:07,210 - INFO - Finished converting document 10-Q_2023-04-21 in 1.11 sec.
2025-11-14 17:22:07,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2023-04-21' --> 'data\processed_data\NFLX\10-Q_2023-04-21.md'


2025-11-14 17:22:07,821 - INFO - Going to convert document batch...
2025-11-14 17:22:07,822 - INFO - Processing document 10-Q_2023-07-21
2025-11-14 17:22:08,502 - INFO - Finished converting document 10-Q_2023-07-21 in 1.02 sec.
2025-11-14 17:22:08,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2023-07-21' --> 'data\processed_data\NFLX\10-Q_2023-07-21.md'


2025-11-14 17:22:09,242 - INFO - Going to convert document batch...
2025-11-14 17:22:09,243 - INFO - Processing document 10-Q_2023-10-20
2025-11-14 17:22:10,369 - INFO - Finished converting document 10-Q_2023-10-20 in 1.48 sec.
2025-11-14 17:22:10,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2023-10-20' --> 'data\processed_data\NFLX\10-Q_2023-10-20.md'


2025-11-14 17:22:11,116 - INFO - Going to convert document batch...
2025-11-14 17:22:11,116 - INFO - Processing document 10-Q_2024-04-22
2025-11-14 17:22:11,784 - INFO - Finished converting document 10-Q_2024-04-22 in 0.97 sec.
2025-11-14 17:22:12,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2024-04-22' --> 'data\processed_data\NFLX\10-Q_2024-04-22.md'


2025-11-14 17:22:12,506 - INFO - Going to convert document batch...
2025-11-14 17:22:12,507 - INFO - Processing document 10-Q_2024-07-19
2025-11-14 17:22:13,732 - INFO - Finished converting document 10-Q_2024-07-19 in 1.62 sec.
2025-11-14 17:22:14,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2024-07-19' --> 'data\processed_data\NFLX\10-Q_2024-07-19.md'


2025-11-14 17:22:14,604 - INFO - Going to convert document batch...
2025-11-14 17:22:14,605 - INFO - Processing document 10-Q_2024-10-18
2025-11-14 17:22:15,640 - INFO - Finished converting document 10-Q_2024-10-18 in 1.47 sec.
2025-11-14 17:22:16,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2024-10-18' --> 'data\processed_data\NFLX\10-Q_2024-10-18.md'


2025-11-14 17:22:16,829 - INFO - Going to convert document batch...
2025-11-14 17:22:16,830 - INFO - Processing document 10-Q_2025-04-18
2025-11-14 17:22:17,509 - INFO - Finished converting document 10-Q_2025-04-18 in 1.33 sec.
2025-11-14 17:22:17,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2025-04-18' --> 'data\processed_data\NFLX\10-Q_2025-04-18.md'


2025-11-14 17:22:18,278 - INFO - Going to convert document batch...
2025-11-14 17:22:18,279 - INFO - Processing document 10-Q_2025-07-18
2025-11-14 17:22:19,181 - INFO - Finished converting document 10-Q_2025-07-18 in 1.31 sec.
2025-11-14 17:22:19,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\10-Q_2025-07-18' --> 'data\processed_data\NFLX\10-Q_2025-07-18.md'


2025-11-14 17:22:20,385 - INFO - Going to convert document batch...
2025-11-14 17:22:20,386 - INFO - Processing document 10-Q_2025-10-22
2025-11-14 17:22:21,329 - INFO - Finished converting document 10-Q_2025-10-22 in 1.67 sec.
2025-11-14 17:22:21,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:21,826 - INFO - Going to convert document batch...
2025-11-14 17:22:21,828 - INFO - Processing document 4_2023-01-04
2025-11-14 17:22:21,848 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 17:22:21,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:21,949 - INFO - Going to convert document batch...
2025-11-14 17:22:21,950 - INFO - Processing document 4_2023-02-01


Converted 'data\edgar_documents\NFLX\10-Q_2025-10-22' --> 'data\processed_data\NFLX\10-Q_2025-10-22.md'
Converted 'data\edgar_documents\NFLX\4_2023-01-04' --> 'data\processed_data\NFLX\4_2023-01-04.md'


2025-11-14 17:22:22,038 - INFO - Finished converting document 4_2023-02-01 in 0.16 sec.
2025-11-14 17:22:22,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,119 - INFO - Going to convert document batch...
2025-11-14 17:22:22,120 - INFO - Processing document 4_2023-02-02
2025-11-14 17:22:22,137 - INFO - Finished converting document 4_2023-02-02 in 0.05 sec.
2025-11-14 17:22:22,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,198 - INFO - Going to convert document batch...
2025-11-14 17:22:22,199 - INFO - Processing document 4_2023-03-02
2025-11-14 17:22:22,216 - INFO - Finished converting document 4_2023-03-02 in 0.06 sec.
2025-11-14 17:22:22,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,254 - INFO - Going to convert document batch...
2025-11-14 17:22:22,255 - INFO - Processing document 4_2023-04-04
2025-11-14 17:22:22,273 - INFO - Finished converting document 4_2023-04-04 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\NFLX\4_2023-02-01' --> 'data\processed_data\NFLX\4_2023-02-01.md'
Converted 'data\edgar_documents\NFLX\4_2023-02-02' --> 'data\processed_data\NFLX\4_2023-02-02.md'
Converted 'data\edgar_documents\NFLX\4_2023-03-02' --> 'data\processed_data\NFLX\4_2023-03-02.md'
Converted 'data\edgar_documents\NFLX\4_2023-04-04' --> 'data\processed_data\NFLX\4_2023-04-04.md'


2025-11-14 17:22:22,317 - INFO - Going to convert document batch...
2025-11-14 17:22:22,318 - INFO - Processing document 4_2023-05-02
2025-11-14 17:22:22,336 - INFO - Finished converting document 4_2023-05-02 in 0.03 sec.
2025-11-14 17:22:22,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,405 - INFO - Going to convert document batch...
2025-11-14 17:22:22,406 - INFO - Processing document 4_2023-05-03
2025-11-14 17:22:22,428 - INFO - Finished converting document 4_2023-05-03 in 0.06 sec.
2025-11-14 17:22:22,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,512 - INFO - Going to convert document batch...
2025-11-14 17:22:22,512 - INFO - Processing document 4_2023-05-11
2025-11-14 17:22:22,559 - INFO - Finished converting document 4_2023-05-11 in 0.11 sec.


Converted 'data\edgar_documents\NFLX\4_2023-05-02' --> 'data\processed_data\NFLX\4_2023-05-02.md'
Converted 'data\edgar_documents\NFLX\4_2023-05-03' --> 'data\processed_data\NFLX\4_2023-05-03.md'


2025-11-14 17:22:22,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,625 - INFO - Going to convert document batch...
2025-11-14 17:22:22,626 - INFO - Processing document 4_2023-05-31
2025-11-14 17:22:22,655 - INFO - Finished converting document 4_2023-05-31 in 0.06 sec.
2025-11-14 17:22:22,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,719 - INFO - Going to convert document batch...
2025-11-14 17:22:22,720 - INFO - Processing document 4_2023-06-02
2025-11-14 17:22:22,751 - INFO - Finished converting document 4_2023-06-02 in 0.06 sec.


Converted 'data\edgar_documents\NFLX\4_2023-05-11' --> 'data\processed_data\NFLX\4_2023-05-11.md'
Converted 'data\edgar_documents\NFLX\4_2023-05-31' --> 'data\processed_data\NFLX\4_2023-05-31.md'


2025-11-14 17:22:22,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,799 - INFO - Going to convert document batch...
2025-11-14 17:22:22,800 - INFO - Processing document 4_2023-06-09
2025-11-14 17:22:22,826 - INFO - Finished converting document 4_2023-06-09 in 0.05 sec.
2025-11-14 17:22:22,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,878 - INFO - Going to convert document batch...
2025-11-14 17:22:22,878 - INFO - Processing document 4_2023-07-05
2025-11-14 17:22:22,899 - INFO - Finished converting document 4_2023-07-05 in 0.03 sec.
2025-11-14 17:22:22,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:22,945 - INFO - Going to convert document batch...
2025-11-14 17:22:22,946 - INFO - Processing document 4_2023-07-07
2025-11-14 17:22:22,969 - INFO - Finished converting document 4_2023-07-07 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2023-06-02' --> 'data\processed_data\NFLX\4_2023-06-02.md'
Converted 'data\edgar_documents\NFLX\4_2023-06-09' --> 'data\processed_data\NFLX\4_2023-06-09.md'
Converted 'data\edgar_documents\NFLX\4_2023-07-05' --> 'data\processed_data\NFLX\4_2023-07-05.md'


2025-11-14 17:22:23,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,023 - INFO - Going to convert document batch...
2025-11-14 17:22:23,024 - INFO - Processing document 4_2023-07-11
2025-11-14 17:22:23,047 - INFO - Finished converting document 4_2023-07-11 in 0.05 sec.
2025-11-14 17:22:23,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,116 - INFO - Going to convert document batch...
2025-11-14 17:22:23,117 - INFO - Processing document 4_2023-07-14
2025-11-14 17:22:23,140 - INFO - Finished converting document 4_2023-07-14 in 0.06 sec.
2025-11-14 17:22:23,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\4_2023-07-07' --> 'data\processed_data\NFLX\4_2023-07-07.md'
Converted 'data\edgar_documents\NFLX\4_2023-07-11' --> 'data\processed_data\NFLX\4_2023-07-11.md'
Converted 'data\edgar_documents\NFLX\4_2023-07-14' --> 'data\processed_data\NFLX\4_2023-07-14.md'


2025-11-14 17:22:23,209 - INFO - Going to convert document batch...
2025-11-14 17:22:23,210 - INFO - Processing document 4_2023-07-21
2025-11-14 17:22:23,231 - INFO - Finished converting document 4_2023-07-21 in 0.06 sec.
2025-11-14 17:22:23,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,276 - INFO - Going to convert document batch...
2025-11-14 17:22:23,277 - INFO - Processing document 4_2023-07-28
2025-11-14 17:22:23,304 - INFO - Finished converting document 4_2023-07-28 in 0.05 sec.
2025-11-14 17:22:23,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,356 - INFO - Going to convert document batch...
2025-11-14 17:22:23,356 - INFO - Processing document 4_2023-08-02
2025-11-14 17:22:23,374 - INFO - Finished converting document 4_2023-08-02 in 0.05 sec.
2025-11-14 17:22:23,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,419 - INFO - Going to convert document batch...
2025-11-14 17:22:23,420 - 

Converted 'data\edgar_documents\NFLX\4_2023-07-21' --> 'data\processed_data\NFLX\4_2023-07-21.md'
Converted 'data\edgar_documents\NFLX\4_2023-07-28' --> 'data\processed_data\NFLX\4_2023-07-28.md'
Converted 'data\edgar_documents\NFLX\4_2023-08-02' --> 'data\processed_data\NFLX\4_2023-08-02.md'


2025-11-14 17:22:23,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,522 - INFO - Going to convert document batch...
2025-11-14 17:22:23,524 - INFO - Processing document 4_2023-08-09
2025-11-14 17:22:23,550 - INFO - Finished converting document 4_2023-08-09 in 0.05 sec.
2025-11-14 17:22:23,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,609 - INFO - Going to convert document batch...
2025-11-14 17:22:23,610 - INFO - Processing document 4_2023-09-05
2025-11-14 17:22:23,635 - INFO - Finished converting document 4_2023-09-05 in 0.06 sec.
2025-11-14 17:22:23,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NFLX\4_2023-08-07' --> 'data\processed_data\NFLX\4_2023-08-07.md'
Converted 'data\edgar_documents\NFLX\4_2023-08-09' --> 'data\processed_data\NFLX\4_2023-08-09.md'
Converted 'data\edgar_documents\NFLX\4_2023-09-05' --> 'data\processed_data\NFLX\4_2023-09-05.md'


2025-11-14 17:22:23,683 - INFO - Processing document 4_2023-09-12
2025-11-14 17:22:23,712 - INFO - Finished converting document 4_2023-09-12 in 0.05 sec.
2025-11-14 17:22:23,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,767 - INFO - Going to convert document batch...
2025-11-14 17:22:23,768 - INFO - Processing document 4_2023-10-03
2025-11-14 17:22:23,804 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 17:22:23,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,873 - INFO - Going to convert document batch...
2025-11-14 17:22:23,875 - INFO - Processing document 4_2023-10-10
2025-11-14 17:22:23,904 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.


Converted 'data\edgar_documents\NFLX\4_2023-09-12' --> 'data\processed_data\NFLX\4_2023-09-12.md'
Converted 'data\edgar_documents\NFLX\4_2023-10-03' --> 'data\processed_data\NFLX\4_2023-10-03.md'


2025-11-14 17:22:23,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:23,946 - INFO - Going to convert document batch...
2025-11-14 17:22:23,947 - INFO - Processing document 4_2023-11-02
2025-11-14 17:22:23,965 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:22:23,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:24,016 - INFO - Going to convert document batch...
2025-11-14 17:22:24,017 - INFO - Processing document 4_2023-11-08
2025-11-14 17:22:24,060 - INFO - Finished converting document 4_2023-11-08 in 0.08 sec.
2025-11-14 17:22:24,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\4_2023-10-10' --> 'data\processed_data\NFLX\4_2023-10-10.md'
Converted 'data\edgar_documents\NFLX\4_2023-11-02' --> 'data\processed_data\NFLX\4_2023-11-02.md'
Converted 'data\edgar_documents\NFLX\4_2023-11-08' --> 'data\processed_data\NFLX\4_2023-11-08.md'


2025-11-14 17:22:24,521 - INFO - Going to convert document batch...
2025-11-14 17:22:24,522 - INFO - Processing document 4_2023-11-09
2025-11-14 17:22:24,548 - INFO - Finished converting document 4_2023-11-09 in 0.45 sec.
2025-11-14 17:22:24,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:24,593 - INFO - Going to convert document batch...
2025-11-14 17:22:24,593 - INFO - Processing document 4_2023-12-04
2025-11-14 17:22:24,612 - INFO - Finished converting document 4_2023-12-04 in 0.03 sec.
2025-11-14 17:22:24,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:24,679 - INFO - Going to convert document batch...
2025-11-14 17:22:24,680 - INFO - Processing document 4_2023-12-12
2025-11-14 17:22:24,738 - INFO - Finished converting document 4_2023-12-12 in 0.11 sec.


Converted 'data\edgar_documents\NFLX\4_2023-11-09' --> 'data\processed_data\NFLX\4_2023-11-09.md'
Converted 'data\edgar_documents\NFLX\4_2023-12-04' --> 'data\processed_data\NFLX\4_2023-12-04.md'


2025-11-14 17:22:24,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:24,813 - INFO - Going to convert document batch...
2025-11-14 17:22:24,814 - INFO - Processing document 4_2023-12-20
2025-11-14 17:22:24,881 - INFO - Finished converting document 4_2023-12-20 in 0.09 sec.
2025-11-14 17:22:24,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:24,953 - INFO - Going to convert document batch...
2025-11-14 17:22:24,954 - INFO - Processing document 4_2023-12-21
2025-11-14 17:22:24,985 - INFO - Finished converting document 4_2023-12-21 in 0.06 sec.


Converted 'data\edgar_documents\NFLX\4_2023-12-12' --> 'data\processed_data\NFLX\4_2023-12-12.md'
Converted 'data\edgar_documents\NFLX\4_2023-12-20' --> 'data\processed_data\NFLX\4_2023-12-20.md'


2025-11-14 17:22:25,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,031 - INFO - Going to convert document batch...
2025-11-14 17:22:25,031 - INFO - Processing document 4_2024-01-03
2025-11-14 17:22:25,053 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 17:22:25,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,132 - INFO - Going to convert document batch...
2025-11-14 17:22:25,133 - INFO - Processing document 4_2024-01-26


Converted 'data\edgar_documents\NFLX\4_2023-12-21' --> 'data\processed_data\NFLX\4_2023-12-21.md'
Converted 'data\edgar_documents\NFLX\4_2024-01-03' --> 'data\processed_data\NFLX\4_2024-01-03.md'


2025-11-14 17:22:25,215 - INFO - Finished converting document 4_2024-01-26 in 0.14 sec.
2025-11-14 17:22:25,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,291 - INFO - Going to convert document batch...
2025-11-14 17:22:25,292 - INFO - Processing document 4_2024-01-29
2025-11-14 17:22:25,312 - INFO - Finished converting document 4_2024-01-29 in 0.05 sec.
2025-11-14 17:22:25,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,360 - INFO - Going to convert document batch...
2025-11-14 17:22:25,360 - INFO - Processing document 4_2024-02-02
2025-11-14 17:22:25,394 - INFO - Finished converting document 4_2024-02-02 in 0.06 sec.
2025-11-14 17:22:25,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,446 - INFO - Going to convert document batch...
2025-11-14 17:22:25,446 - INFO - Processing document 4_2024-02-07
2025-11-14 17:22:25,468 - INFO - Finished converting document 4_2024-02-07 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2024-01-26' --> 'data\processed_data\NFLX\4_2024-01-26.md'
Converted 'data\edgar_documents\NFLX\4_2024-01-29' --> 'data\processed_data\NFLX\4_2024-01-29.md'
Converted 'data\edgar_documents\NFLX\4_2024-02-02' --> 'data\processed_data\NFLX\4_2024-02-02.md'


2025-11-14 17:22:25,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,512 - INFO - Going to convert document batch...
2025-11-14 17:22:25,513 - INFO - Processing document 4_2024-02-12
2025-11-14 17:22:25,533 - INFO - Finished converting document 4_2024-02-12 in 0.05 sec.
2025-11-14 17:22:25,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,580 - INFO - Going to convert document batch...
2025-11-14 17:22:25,581 - INFO - Processing document 4_2024-02-28
2025-11-14 17:22:25,602 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 17:22:25,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,643 - INFO - Going to convert document batch...
2025-11-14 17:22:25,644 - INFO - Processing document 4_2024-03-04
2025-11-14 17:22:25,663 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.


Converted 'data\edgar_documents\NFLX\4_2024-02-07' --> 'data\processed_data\NFLX\4_2024-02-07.md'
Converted 'data\edgar_documents\NFLX\4_2024-02-12' --> 'data\processed_data\NFLX\4_2024-02-12.md'
Converted 'data\edgar_documents\NFLX\4_2024-02-28' --> 'data\processed_data\NFLX\4_2024-02-28.md'


2025-11-14 17:22:25,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,703 - INFO - Going to convert document batch...
2025-11-14 17:22:25,704 - INFO - Processing document 4_2024-03-19
2025-11-14 17:22:25,728 - INFO - Finished converting document 4_2024-03-19 in 0.05 sec.
2025-11-14 17:22:25,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,771 - INFO - Going to convert document batch...
2025-11-14 17:22:25,774 - INFO - Processing document 4_2024-04-02
2025-11-14 17:22:25,819 - INFO - Finished converting document 4_2024-04-02 in 0.06 sec.
2025-11-14 17:22:25,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\4_2024-03-04' --> 'data\processed_data\NFLX\4_2024-03-04.md'
Converted 'data\edgar_documents\NFLX\4_2024-03-19' --> 'data\processed_data\NFLX\4_2024-03-19.md'
Converted 'data\edgar_documents\NFLX\4_2024-04-02' --> 'data\processed_data\NFLX\4_2024-04-02.md'


2025-11-14 17:22:25,864 - INFO - Going to convert document batch...
2025-11-14 17:22:25,865 - INFO - Processing document 4_2024-05-02
2025-11-14 17:22:25,884 - INFO - Finished converting document 4_2024-05-02 in 0.03 sec.
2025-11-14 17:22:25,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:25,941 - INFO - Going to convert document batch...
2025-11-14 17:22:25,942 - INFO - Processing document 4_2024-05-06
2025-11-14 17:22:25,984 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.
2025-11-14 17:22:26,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,027 - INFO - Going to convert document batch...
2025-11-14 17:22:26,028 - INFO - Processing document 4_2024-05-10
2025-11-14 17:22:26,046 - INFO - Finished converting document 4_2024-05-10 in 0.05 sec.
2025-11-14 17:22:26,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,087 - INFO - Going to convert document batch...
2025-11-14 17:22:26,087 - 

Converted 'data\edgar_documents\NFLX\4_2024-05-02' --> 'data\processed_data\NFLX\4_2024-05-02.md'
Converted 'data\edgar_documents\NFLX\4_2024-05-06' --> 'data\processed_data\NFLX\4_2024-05-06.md'
Converted 'data\edgar_documents\NFLX\4_2024-05-10' --> 'data\processed_data\NFLX\4_2024-05-10.md'


2025-11-14 17:22:26,110 - INFO - Finished converting document 4_2024-05-22 in 0.05 sec.
2025-11-14 17:22:26,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,151 - INFO - Going to convert document batch...
2025-11-14 17:22:26,152 - INFO - Processing document 4_2024-06-04
2025-11-14 17:22:26,170 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 17:22:26,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,216 - INFO - Going to convert document batch...
2025-11-14 17:22:26,217 - INFO - Processing document 4_2024-06-17
2025-11-14 17:22:26,238 - INFO - Finished converting document 4_2024-06-17 in 0.05 sec.
2025-11-14 17:22:26,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,279 - INFO - Going to convert document batch...
2025-11-14 17:22:26,280 - INFO - Processing document 4_2024-07-02
2025-11-14 17:22:26,298 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2024-05-22' --> 'data\processed_data\NFLX\4_2024-05-22.md'
Converted 'data\edgar_documents\NFLX\4_2024-06-04' --> 'data\processed_data\NFLX\4_2024-06-04.md'
Converted 'data\edgar_documents\NFLX\4_2024-06-17' --> 'data\processed_data\NFLX\4_2024-06-17.md'


2025-11-14 17:22:26,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,338 - INFO - Going to convert document batch...
2025-11-14 17:22:26,338 - INFO - Processing document 4_2024-07-03
2025-11-14 17:22:26,359 - INFO - Finished converting document 4_2024-07-03 in 0.05 sec.
2025-11-14 17:22:26,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,401 - INFO - Going to convert document batch...
2025-11-14 17:22:26,401 - INFO - Processing document 4_2024-07-26
2025-11-14 17:22:26,422 - INFO - Finished converting document 4_2024-07-26 in 0.05 sec.
2025-11-14 17:22:26,474 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:22:26,474 - ERROR - Input document 4_2024-07-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\NFLX\4_2024-07-02' --> 'data\processed_data\NFLX\4_2024-07-02.md'
Converted 'data\edgar_documents\NFLX\4_2024-07-03' --> 'data\processed_data\NFLX\4_2024-07-03.md'
Converted 'data\edgar_documents\NFLX\4_2024-07-26' --> 'data\processed_data\NFLX\4_2024-07-26.md'
Error processing data\edgar_documents\NFLX\4_2024-07-30: File format not allowed: data\edgar_documents\NFLX\4_2024-07-30


2025-11-14 17:22:26,499 - ERROR - Input document 4_2024-07-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:22:26,499 - INFO - Going to convert document batch...
2025-11-14 17:22:26,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,519 - INFO - Going to convert document batch...
2025-11-14 17:22:26,520 - INFO - Processing document 4_2024-08-02
2025-11-14 17:22:26,540 - INFO - Finished converting document 4_2024-08-02 in 0.03 sec.
2025-11-14 17:22:26,591 - INFO - detec

Error processing data\edgar_documents\NFLX\4_2024-07-31: File format not allowed: data\edgar_documents\NFLX\4_2024-07-31
Converted 'data\edgar_documents\NFLX\4_2024-08-02' --> 'data\processed_data\NFLX\4_2024-08-02.md'
Converted 'data\edgar_documents\NFLX\4_2024-08-07' --> 'data\processed_data\NFLX\4_2024-08-07.md'


2025-11-14 17:22:26,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,740 - INFO - Going to convert document batch...
2025-11-14 17:22:26,741 - INFO - Processing document 4_2024-08-14
2025-11-14 17:22:26,807 - INFO - Finished converting document 4_2024-08-14 in 0.11 sec.
2025-11-14 17:22:26,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,878 - INFO - Going to convert document batch...
2025-11-14 17:22:26,879 - INFO - Processing document 4_2024-08-21


Converted 'data\edgar_documents\NFLX\4_2024-08-09' --> 'data\processed_data\NFLX\4_2024-08-09.md'
Converted 'data\edgar_documents\NFLX\4_2024-08-14' --> 'data\processed_data\NFLX\4_2024-08-14.md'


2025-11-14 17:22:26,909 - INFO - Finished converting document 4_2024-08-21 in 0.06 sec.
2025-11-14 17:22:26,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:26,969 - INFO - Going to convert document batch...
2025-11-14 17:22:26,970 - INFO - Processing document 4_2024-09-04
2025-11-14 17:22:26,991 - INFO - Finished converting document 4_2024-09-04 in 0.05 sec.
2025-11-14 17:22:27,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,044 - INFO - Going to convert document batch...
2025-11-14 17:22:27,045 - INFO - Processing document 4_2024-09-13
2025-11-14 17:22:27,094 - INFO - Finished converting document 4_2024-09-13 in 0.08 sec.


Converted 'data\edgar_documents\NFLX\4_2024-08-21' --> 'data\processed_data\NFLX\4_2024-08-21.md'
Converted 'data\edgar_documents\NFLX\4_2024-09-04' --> 'data\processed_data\NFLX\4_2024-09-04.md'


2025-11-14 17:22:27,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,162 - INFO - Going to convert document batch...
2025-11-14 17:22:27,163 - INFO - Processing document 4_2024-09-20
2025-11-14 17:22:27,186 - INFO - Finished converting document 4_2024-09-20 in 0.05 sec.
2025-11-14 17:22:27,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,249 - INFO - Going to convert document batch...
2025-11-14 17:22:27,251 - INFO - Processing document 4_2024-09-26
2025-11-14 17:22:27,278 - INFO - Finished converting document 4_2024-09-26 in 0.08 sec.
2025-11-14 17:22:27,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,319 - INFO - Going to convert document batch...
2025-11-14 17:22:27,320 - INFO - Processing document 4_2024-10-02


Converted 'data\edgar_documents\NFLX\4_2024-09-13' --> 'data\processed_data\NFLX\4_2024-09-13.md'
Converted 'data\edgar_documents\NFLX\4_2024-09-20' --> 'data\processed_data\NFLX\4_2024-09-20.md'
Converted 'data\edgar_documents\NFLX\4_2024-09-26' --> 'data\processed_data\NFLX\4_2024-09-26.md'


2025-11-14 17:22:27,340 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:22:27,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,380 - INFO - Going to convert document batch...
2025-11-14 17:22:27,381 - INFO - Processing document 4_2024-10-11
2025-11-14 17:22:27,402 - INFO - Finished converting document 4_2024-10-11 in 0.05 sec.
2025-11-14 17:22:27,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,450 - INFO - Going to convert document batch...
2025-11-14 17:22:27,451 - INFO - Processing document 4_2024-10-21
2025-11-14 17:22:27,472 - INFO - Finished converting document 4_2024-10-21 in 0.05 sec.
2025-11-14 17:22:27,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,527 - INFO - Going to convert document batch...
2025-11-14 17:22:27,528 - INFO - Processing document 4_2024-10-28


Converted 'data\edgar_documents\NFLX\4_2024-10-02' --> 'data\processed_data\NFLX\4_2024-10-02.md'
Converted 'data\edgar_documents\NFLX\4_2024-10-11' --> 'data\processed_data\NFLX\4_2024-10-11.md'
Converted 'data\edgar_documents\NFLX\4_2024-10-21' --> 'data\processed_data\NFLX\4_2024-10-21.md'


2025-11-14 17:22:27,577 - INFO - Finished converting document 4_2024-10-28 in 0.08 sec.
2025-11-14 17:22:27,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,637 - INFO - Going to convert document batch...
2025-11-14 17:22:27,638 - INFO - Processing document 4_2024-10-30
2025-11-14 17:22:27,655 - INFO - Finished converting document 4_2024-10-30 in 0.05 sec.
2025-11-14 17:22:27,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,696 - INFO - Going to convert document batch...
2025-11-14 17:22:27,696 - INFO - Processing document 4_2024-11-04
2025-11-14 17:22:27,716 - INFO - Finished converting document 4_2024-11-04 in 0.05 sec.
2025-11-14 17:22:27,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,756 - INFO - Going to convert document batch...
2025-11-14 17:22:27,756 - INFO - Processing document 4_2024-11-06
2025-11-14 17:22:27,778 - INFO - Finished converting document 4_2024-11-06 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2024-10-28' --> 'data\processed_data\NFLX\4_2024-10-28.md'
Converted 'data\edgar_documents\NFLX\4_2024-10-30' --> 'data\processed_data\NFLX\4_2024-10-30.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-04' --> 'data\processed_data\NFLX\4_2024-11-04.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-06' --> 'data\processed_data\NFLX\4_2024-11-06.md'


2025-11-14 17:22:27,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:27,841 - INFO - Going to convert document batch...
2025-11-14 17:22:27,842 - INFO - Processing document 4_2024-11-07
2025-11-14 17:22:28,100 - INFO - Finished converting document 4_2024-11-07 in 0.30 sec.
2025-11-14 17:22:28,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,147 - INFO - Going to convert document batch...
2025-11-14 17:22:28,147 - INFO - Processing document 4_2024-11-08
2025-11-14 17:22:28,167 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 17:22:28,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,210 - INFO - Going to convert document batch...
2025-11-14 17:22:28,211 - INFO - Processing document 4_2024-11-12
2025-11-14 17:22:28,231 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:22:28,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\NFLX\4_2024-11-07' --> 'data\processed_data\NFLX\4_2024-11-07.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-08' --> 'data\processed_data\NFLX\4_2024-11-08.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-12' --> 'data\processed_data\NFLX\4_2024-11-12.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-13' --> 'data\processed_data\NFLX\4_2024-11-13.md'


2025-11-14 17:22:28,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,359 - INFO - Going to convert document batch...
2025-11-14 17:22:28,359 - INFO - Processing document 4_2024-11-18
2025-11-14 17:22:28,384 - INFO - Finished converting document 4_2024-11-18 in 0.06 sec.
2025-11-14 17:22:28,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,438 - INFO - Going to convert document batch...
2025-11-14 17:22:28,439 - INFO - Processing document 4_2024-11-20
2025-11-14 17:22:28,479 - INFO - Finished converting document 4_2024-11-20 in 0.08 sec.
2025-11-14 17:22:28,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,530 - INFO - Going to convert document batch...
2025-11-14 17:22:28,530 - INFO - Processing document 4_2024-12-03
2025-11-14 17:22:28,550 - INFO - Finished converting document 4_2024-12-03 in 0.03 sec.
2025-11-14 17:22:28,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\NFLX\4_2024-11-18' --> 'data\processed_data\NFLX\4_2024-11-18.md'
Converted 'data\edgar_documents\NFLX\4_2024-11-20' --> 'data\processed_data\NFLX\4_2024-11-20.md'
Converted 'data\edgar_documents\NFLX\4_2024-12-03' --> 'data\processed_data\NFLX\4_2024-12-03.md'


2025-11-14 17:22:28,589 - INFO - Processing document 4_2025-01-03
2025-11-14 17:22:28,608 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:22:28,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,651 - INFO - Going to convert document batch...
2025-11-14 17:22:28,652 - INFO - Processing document 4_2025-01-06
2025-11-14 17:22:28,672 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 17:22:28,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,712 - INFO - Going to convert document batch...
2025-11-14 17:22:28,713 - INFO - Processing document 4_2025-01-08
2025-11-14 17:22:28,732 - INFO - Finished converting document 4_2025-01-08 in 0.05 sec.
2025-11-14 17:22:28,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,774 - INFO - Going to convert document batch...
2025-11-14 17:22:28,775 - INFO - Processing document 4_2025-01-24
2025-11-14 17:22:28,795 - IN

Converted 'data\edgar_documents\NFLX\4_2025-01-03' --> 'data\processed_data\NFLX\4_2025-01-03.md'
Converted 'data\edgar_documents\NFLX\4_2025-01-06' --> 'data\processed_data\NFLX\4_2025-01-06.md'
Converted 'data\edgar_documents\NFLX\4_2025-01-08' --> 'data\processed_data\NFLX\4_2025-01-08.md'


2025-11-14 17:22:28,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,837 - INFO - Going to convert document batch...
2025-11-14 17:22:28,838 - INFO - Processing document 4_2025-01-28
2025-11-14 17:22:28,861 - INFO - Finished converting document 4_2025-01-28 in 0.05 sec.
2025-11-14 17:22:28,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:28,970 - INFO - Going to convert document batch...
2025-11-14 17:22:28,971 - INFO - Processing document 4_2025-02-03


Converted 'data\edgar_documents\NFLX\4_2025-01-24' --> 'data\processed_data\NFLX\4_2025-01-24.md'
Converted 'data\edgar_documents\NFLX\4_2025-01-28' --> 'data\processed_data\NFLX\4_2025-01-28.md'


2025-11-14 17:22:29,063 - INFO - Finished converting document 4_2025-02-03 in 0.16 sec.
2025-11-14 17:22:29,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,192 - INFO - Going to convert document batch...
2025-11-14 17:22:29,193 - INFO - Processing document 4_2025-02-04
2025-11-14 17:22:29,248 - INFO - Finished converting document 4_2025-02-04 in 0.12 sec.
2025-11-14 17:22:29,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\4_2025-02-03' --> 'data\processed_data\NFLX\4_2025-02-03.md'
Converted 'data\edgar_documents\NFLX\4_2025-02-04' --> 'data\processed_data\NFLX\4_2025-02-04.md'


2025-11-14 17:22:29,343 - INFO - Going to convert document batch...
2025-11-14 17:22:29,344 - INFO - Processing document 4_2025-02-05
2025-11-14 17:22:29,368 - INFO - Finished converting document 4_2025-02-05 in 0.06 sec.
2025-11-14 17:22:29,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,426 - INFO - Going to convert document batch...
2025-11-14 17:22:29,427 - INFO - Processing document 4_2025-02-06
2025-11-14 17:22:29,453 - INFO - Finished converting document 4_2025-02-06 in 0.06 sec.
2025-11-14 17:22:29,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,508 - INFO - Going to convert document batch...
2025-11-14 17:22:29,508 - INFO - Processing document 4_2025-02-07
2025-11-14 17:22:29,560 - INFO - Finished converting document 4_2025-02-07 in 0.09 sec.


Converted 'data\edgar_documents\NFLX\4_2025-02-05' --> 'data\processed_data\NFLX\4_2025-02-05.md'
Converted 'data\edgar_documents\NFLX\4_2025-02-06' --> 'data\processed_data\NFLX\4_2025-02-06.md'


2025-11-14 17:22:29,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,620 - INFO - Going to convert document batch...
2025-11-14 17:22:29,621 - INFO - Processing document 4_2025-02-11
2025-11-14 17:22:29,644 - INFO - Finished converting document 4_2025-02-11 in 0.05 sec.
2025-11-14 17:22:29,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,692 - INFO - Going to convert document batch...
2025-11-14 17:22:29,693 - INFO - Processing document 4_2025-02-14
2025-11-14 17:22:29,714 - INFO - Finished converting document 4_2025-02-14 in 0.05 sec.
2025-11-14 17:22:29,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,761 - INFO - Going to convert document batch...
2025-11-14 17:22:29,761 - INFO - Processing document 4_2025-02-27
2025-11-14 17:22:29,790 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2025-02-07' --> 'data\processed_data\NFLX\4_2025-02-07.md'
Converted 'data\edgar_documents\NFLX\4_2025-02-11' --> 'data\processed_data\NFLX\4_2025-02-11.md'
Converted 'data\edgar_documents\NFLX\4_2025-02-14' --> 'data\processed_data\NFLX\4_2025-02-14.md'


2025-11-14 17:22:29,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,837 - INFO - Going to convert document batch...
2025-11-14 17:22:29,838 - INFO - Processing document 4_2025-03-04
2025-11-14 17:22:29,857 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.
2025-11-14 17:22:29,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,902 - INFO - Going to convert document batch...
2025-11-14 17:22:29,904 - INFO - Processing document 4_2025-03-26
2025-11-14 17:22:29,929 - INFO - Finished converting document 4_2025-03-26 in 0.05 sec.
2025-11-14 17:22:29,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:29,974 - INFO - Going to convert document batch...
2025-11-14 17:22:29,975 - INFO - Processing document 4_2025-04-02
2025-11-14 17:22:29,992 - INFO - Finished converting document 4_2025-04-02 in 0.03 sec.


Converted 'data\edgar_documents\NFLX\4_2025-02-27' --> 'data\processed_data\NFLX\4_2025-02-27.md'
Converted 'data\edgar_documents\NFLX\4_2025-03-04' --> 'data\processed_data\NFLX\4_2025-03-04.md'
Converted 'data\edgar_documents\NFLX\4_2025-03-26' --> 'data\processed_data\NFLX\4_2025-03-26.md'


2025-11-14 17:22:30,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,036 - INFO - Going to convert document batch...
2025-11-14 17:22:30,036 - INFO - Processing document 4_2025-04-22
2025-11-14 17:22:30,064 - INFO - Finished converting document 4_2025-04-22 in 0.05 sec.
2025-11-14 17:22:30,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,130 - INFO - Going to convert document batch...
2025-11-14 17:22:30,131 - INFO - Processing document 4_2025-04-23
2025-11-14 17:22:30,186 - INFO - Finished converting document 4_2025-04-23 in 0.09 sec.


Converted 'data\edgar_documents\NFLX\4_2025-04-02' --> 'data\processed_data\NFLX\4_2025-04-02.md'
Converted 'data\edgar_documents\NFLX\4_2025-04-22' --> 'data\processed_data\NFLX\4_2025-04-22.md'


2025-11-14 17:22:30,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,253 - INFO - Going to convert document batch...
2025-11-14 17:22:30,255 - INFO - Processing document 4_2025-04-24
2025-11-14 17:22:30,288 - INFO - Finished converting document 4_2025-04-24 in 0.06 sec.
2025-11-14 17:22:30,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,355 - INFO - Going to convert document batch...
2025-11-14 17:22:30,357 - INFO - Processing document 4_2025-04-28
2025-11-14 17:22:30,384 - INFO - Finished converting document 4_2025-04-28 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2025-04-23' --> 'data\processed_data\NFLX\4_2025-04-23.md'
Converted 'data\edgar_documents\NFLX\4_2025-04-24' --> 'data\processed_data\NFLX\4_2025-04-24.md'
Converted 'data\edgar_documents\NFLX\4_2025-04-28' --> 'data\processed_data\NFLX\4_2025-04-28.md'


2025-11-14 17:22:30,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,452 - INFO - Going to convert document batch...
2025-11-14 17:22:30,453 - INFO - Processing document 4_2025-04-30
2025-11-14 17:22:30,476 - INFO - Finished converting document 4_2025-04-30 in 0.06 sec.
2025-11-14 17:22:30,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,534 - INFO - Going to convert document batch...
2025-11-14 17:22:30,535 - INFO - Processing document 4_2025-05-01
2025-11-14 17:22:30,583 - INFO - Finished converting document 4_2025-05-01 in 0.08 sec.
2025-11-14 17:22:30,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,655 - INFO - Going to convert document batch...
2025-11-14 17:22:30,655 - INFO - Processing document 4_2025-05-02
2025-11-14 17:22:30,695 - INFO - Finished converting document 4_2025-05-02 in 0.06 sec.


Converted 'data\edgar_documents\NFLX\4_2025-04-30' --> 'data\processed_data\NFLX\4_2025-04-30.md'
Converted 'data\edgar_documents\NFLX\4_2025-05-01' --> 'data\processed_data\NFLX\4_2025-05-01.md'


2025-11-14 17:22:30,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,747 - INFO - Going to convert document batch...
2025-11-14 17:22:30,748 - INFO - Processing document 4_2025-05-05
2025-11-14 17:22:30,769 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 17:22:30,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:30,831 - INFO - Going to convert document batch...
2025-11-14 17:22:30,832 - INFO - Processing document 4_2025-05-07
2025-11-14 17:22:30,863 - INFO - Finished converting document 4_2025-05-07 in 0.06 sec.
2025-11-14 17:22:30,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\4_2025-05-02' --> 'data\processed_data\NFLX\4_2025-05-02.md'
Converted 'data\edgar_documents\NFLX\4_2025-05-05' --> 'data\processed_data\NFLX\4_2025-05-05.md'
Converted 'data\edgar_documents\NFLX\4_2025-05-07' --> 'data\processed_data\NFLX\4_2025-05-07.md'


2025-11-14 17:22:30,941 - INFO - Going to convert document batch...
2025-11-14 17:22:30,941 - INFO - Processing document 4_2025-05-12
2025-11-14 17:22:30,982 - INFO - Finished converting document 4_2025-05-12 in 0.09 sec.
2025-11-14 17:22:31,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,046 - INFO - Going to convert document batch...
2025-11-14 17:22:31,047 - INFO - Processing document 4_2025-05-13
2025-11-14 17:22:31,092 - INFO - Finished converting document 4_2025-05-13 in 0.08 sec.
2025-11-14 17:22:31,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,166 - INFO - Going to convert document batch...
2025-11-14 17:22:31,167 - INFO - Processing document 4_2025-05-16


Converted 'data\edgar_documents\NFLX\4_2025-05-12' --> 'data\processed_data\NFLX\4_2025-05-12.md'
Converted 'data\edgar_documents\NFLX\4_2025-05-13' --> 'data\processed_data\NFLX\4_2025-05-13.md'


2025-11-14 17:22:31,425 - INFO - Finished converting document 4_2025-05-16 in 0.30 sec.
2025-11-14 17:22:31,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,472 - INFO - Going to convert document batch...
2025-11-14 17:22:31,473 - INFO - Processing document 4_2025-05-28
2025-11-14 17:22:31,497 - INFO - Finished converting document 4_2025-05-28 in 0.05 sec.
2025-11-14 17:22:31,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,584 - INFO - Going to convert document batch...
2025-11-14 17:22:31,585 - INFO - Processing document 4_2025-06-02
2025-11-14 17:22:31,647 - INFO - Finished converting document 4_2025-06-02 in 0.12 sec.


Converted 'data\edgar_documents\NFLX\4_2025-05-16' --> 'data\processed_data\NFLX\4_2025-05-16.md'
Converted 'data\edgar_documents\NFLX\4_2025-05-28' --> 'data\processed_data\NFLX\4_2025-05-28.md'


2025-11-14 17:22:31,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,740 - INFO - Going to convert document batch...
2025-11-14 17:22:31,741 - INFO - Processing document 4_2025-06-03
2025-11-14 17:22:31,761 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 17:22:31,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,818 - INFO - Going to convert document batch...
2025-11-14 17:22:31,819 - INFO - Processing document 4_2025-06-04
2025-11-14 17:22:31,843 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 17:22:31,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,890 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NFLX\4_2025-06-02' --> 'data\processed_data\NFLX\4_2025-06-02.md'
Converted 'data\edgar_documents\NFLX\4_2025-06-03' --> 'data\processed_data\NFLX\4_2025-06-03.md'
Converted 'data\edgar_documents\NFLX\4_2025-06-04' --> 'data\processed_data\NFLX\4_2025-06-04.md'


2025-11-14 17:22:31,891 - INFO - Processing document 4_2025-06-06
2025-11-14 17:22:31,920 - INFO - Finished converting document 4_2025-06-06 in 0.06 sec.
2025-11-14 17:22:31,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:31,978 - INFO - Going to convert document batch...
2025-11-14 17:22:31,978 - INFO - Processing document 4_2025-06-09
2025-11-14 17:22:32,012 - INFO - Finished converting document 4_2025-06-09 in 0.06 sec.
2025-11-14 17:22:32,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,108 - INFO - Going to convert document batch...
2025-11-14 17:22:32,110 - INFO - Processing document 4_2025-06-25
2025-11-14 17:22:32,163 - INFO - Finished converting document 4_2025-06-25 in 0.11 sec.


Converted 'data\edgar_documents\NFLX\4_2025-06-06' --> 'data\processed_data\NFLX\4_2025-06-06.md'
Converted 'data\edgar_documents\NFLX\4_2025-06-09' --> 'data\processed_data\NFLX\4_2025-06-09.md'


2025-11-14 17:22:32,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,210 - INFO - Going to convert document batch...
2025-11-14 17:22:32,212 - INFO - Processing document 4_2025-06-26
2025-11-14 17:22:32,233 - INFO - Finished converting document 4_2025-06-26 in 0.05 sec.
2025-11-14 17:22:32,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,282 - INFO - Going to convert document batch...
2025-11-14 17:22:32,283 - INFO - Processing document 4_2025-07-02
2025-11-14 17:22:32,311 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 17:22:32,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,354 - INFO - Going to convert document batch...
2025-11-14 17:22:32,355 - INFO - Processing document 4_2025-08-04
2025-11-14 17:22:32,372 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.


Converted 'data\edgar_documents\NFLX\4_2025-06-25' --> 'data\processed_data\NFLX\4_2025-06-25.md'
Converted 'data\edgar_documents\NFLX\4_2025-06-26' --> 'data\processed_data\NFLX\4_2025-06-26.md'
Converted 'data\edgar_documents\NFLX\4_2025-07-02' --> 'data\processed_data\NFLX\4_2025-07-02.md'


2025-11-14 17:22:32,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,416 - INFO - Going to convert document batch...
2025-11-14 17:22:32,416 - INFO - Processing document 4_2025-08-06
2025-11-14 17:22:32,446 - INFO - Finished converting document 4_2025-08-06 in 0.05 sec.
2025-11-14 17:22:32,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,518 - INFO - Going to convert document batch...
2025-11-14 17:22:32,519 - INFO - Processing document 4_2025-09-03
2025-11-14 17:22:32,539 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:22:32,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,578 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NFLX\4_2025-08-04' --> 'data\processed_data\NFLX\4_2025-08-04.md'
Converted 'data\edgar_documents\NFLX\4_2025-08-06' --> 'data\processed_data\NFLX\4_2025-08-06.md'
Converted 'data\edgar_documents\NFLX\4_2025-09-03' --> 'data\processed_data\NFLX\4_2025-09-03.md'


2025-11-14 17:22:32,579 - INFO - Processing document 4_2025-10-02
2025-11-14 17:22:32,597 - INFO - Finished converting document 4_2025-10-02 in 0.03 sec.
2025-11-14 17:22:32,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,642 - INFO - Going to convert document batch...
2025-11-14 17:22:32,643 - INFO - Processing document 4_2025-11-04
2025-11-14 17:22:32,663 - INFO - Finished converting document 4_2025-11-04 in 0.03 sec.
2025-11-14 17:22:32,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,710 - INFO - Going to convert document batch...
2025-11-14 17:22:32,711 - INFO - Processing document 4_2025-11-05
2025-11-14 17:22:32,739 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 17:22:32,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,807 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NFLX\4_2025-10-02' --> 'data\processed_data\NFLX\4_2025-10-02.md'
Converted 'data\edgar_documents\NFLX\4_2025-11-04' --> 'data\processed_data\NFLX\4_2025-11-04.md'
Converted 'data\edgar_documents\NFLX\4_2025-11-05' --> 'data\processed_data\NFLX\4_2025-11-05.md'


2025-11-14 17:22:32,808 - INFO - Processing document 4_2025-11-06
2025-11-14 17:22:32,826 - INFO - Finished converting document 4_2025-11-06 in 0.06 sec.
2025-11-14 17:22:32,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,874 - INFO - Going to convert document batch...
2025-11-14 17:22:32,877 - INFO - Processing document 8-K_2023-01-09
2025-11-14 17:22:32,897 - INFO - Finished converting document 8-K_2023-01-09 in 0.05 sec.
2025-11-14 17:22:32,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:32,949 - INFO - Going to convert document batch...
2025-11-14 17:22:32,950 - INFO - Processing document 8-K_2023-01-19
2025-11-14 17:22:32,969 - INFO - Finished converting document 8-K_2023-01-19 in 0.06 sec.
2025-11-14 17:22:32,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,004 - INFO - Going to convert document batch...
2025-11-14 17:22:33,005 - INFO - Processing document 8-K_2023-02-24
2025-11-14 17:22:3

Converted 'data\edgar_documents\NFLX\4_2025-11-06' --> 'data\processed_data\NFLX\4_2025-11-06.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-01-09' --> 'data\processed_data\NFLX\8-K_2023-01-09.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-01-19' --> 'data\processed_data\NFLX\8-K_2023-01-19.md'


2025-11-14 17:22:33,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,055 - INFO - Going to convert document batch...
2025-11-14 17:22:33,057 - INFO - Processing document 8-K_2023-04-18
2025-11-14 17:22:33,071 - INFO - Finished converting document 8-K_2023-04-18 in 0.03 sec.
2025-11-14 17:22:33,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,114 - INFO - Going to convert document batch...
2025-11-14 17:22:33,115 - INFO - Processing document 8-K_2023-06-06
2025-11-14 17:22:33,152 - INFO - Finished converting document 8-K_2023-06-06 in 0.08 sec.
2025-11-14 17:22:33,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,191 - INFO - Going to convert document batch...
2025-11-14 17:22:33,192 - INFO - Processing document 8-K_2023-07-19
2025-11-14 17:22:33,206 - INFO - Finished converting document 8-K_2023-07-19 in 0.03 sec.
2025-11-14 17:22:33,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\8-K_2023-02-24' --> 'data\processed_data\NFLX\8-K_2023-02-24.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-04-18' --> 'data\processed_data\NFLX\8-K_2023-04-18.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-06-06' --> 'data\processed_data\NFLX\8-K_2023-06-06.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-07-19' --> 'data\processed_data\NFLX\8-K_2023-07-19.md'


2025-11-14 17:22:33,239 - INFO - Going to convert document batch...
2025-11-14 17:22:33,239 - INFO - Processing document 8-K_2023-09-08
2025-11-14 17:22:33,251 - INFO - Finished converting document 8-K_2023-09-08 in 0.03 sec.
2025-11-14 17:22:33,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,300 - INFO - Going to convert document batch...
2025-11-14 17:22:33,301 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:22:33,327 - INFO - Finished converting document 8-K_2023-10-18 in 0.06 sec.
2025-11-14 17:22:33,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,370 - INFO - Going to convert document batch...
2025-11-14 17:22:33,371 - INFO - Processing document 8-K_2023-12-08
2025-11-14 17:22:33,399 - INFO - Finished converting document 8-K_2023-12-08 in 0.05 sec.
2025-11-14 17:22:33,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,441 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NFLX\8-K_2023-09-08' --> 'data\processed_data\NFLX\8-K_2023-09-08.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-10-18' --> 'data\processed_data\NFLX\8-K_2023-10-18.md'
Converted 'data\edgar_documents\NFLX\8-K_2023-12-08' --> 'data\processed_data\NFLX\8-K_2023-12-08.md'


2025-11-14 17:22:33,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,485 - INFO - Going to convert document batch...
2025-11-14 17:22:33,485 - INFO - Processing document 8-K_2024-04-18
2025-11-14 17:22:33,500 - INFO - Finished converting document 8-K_2024-04-18 in 0.03 sec.
2025-11-14 17:22:33,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,541 - INFO - Going to convert document batch...
2025-11-14 17:22:33,542 - INFO - Processing document 8-K_2024-06-07
2025-11-14 17:22:33,580 - INFO - Finished converting document 8-K_2024-06-07 in 0.06 sec.
2025-11-14 17:22:33,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,617 - INFO - Going to convert document batch...
2025-11-14 17:22:33,618 - INFO - Processing document 8-K_2024-07-18
2025-11-14 17:22:33,632 - INFO - Finished converting document 8-K_2024-07-18 in 0.03 sec.
2025-11-14 17:22:33,656 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_ja

Converted 'data\edgar_documents\NFLX\8-K_2024-01-23' --> 'data\processed_data\NFLX\8-K_2024-01-23.md'
Converted 'data\edgar_documents\NFLX\8-K_2024-04-18' --> 'data\processed_data\NFLX\8-K_2024-04-18.md'
Converted 'data\edgar_documents\NFLX\8-K_2024-06-07' --> 'data\processed_data\NFLX\8-K_2024-06-07.md'
Converted 'data\edgar_documents\NFLX\8-K_2024-07-18' --> 'data\processed_data\NFLX\8-K_2024-07-18.md'


2025-11-14 17:22:33,657 - ERROR - Input document 8-K_2024-08-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:22:33,658 - INFO - Going to convert document batch...
2025-11-14 17:22:33,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,676 - INFO - Going to convert document batch...
2025-11-14 17:22:33,677 - INFO - Processing document 8-K_2024-10-17
2025-11-14 17:22:33,692 - INFO - Finished converting document 8-K_2024-10-17 in 0.03 sec.
2025-11-14 17:22:33,714 - INFO -

Error processing data\edgar_documents\NFLX\8-K_2024-08-01: File format not allowed: data\edgar_documents\NFLX\8-K_2024-08-01
Converted 'data\edgar_documents\NFLX\8-K_2024-10-17' --> 'data\processed_data\NFLX\8-K_2024-10-17.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-01-21' --> 'data\processed_data\NFLX\8-K_2025-01-21.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-04-17' --> 'data\processed_data\NFLX\8-K_2025-04-17.md'


2025-11-14 17:22:33,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,898 - INFO - Going to convert document batch...
2025-11-14 17:22:33,899 - INFO - Processing document 8-K_2025-06-24
2025-11-14 17:22:33,916 - INFO - Finished converting document 8-K_2025-06-24 in 0.03 sec.
2025-11-14 17:22:33,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:33,960 - INFO - Going to convert document batch...
2025-11-14 17:22:33,962 - INFO - Processing document 8-K_2025-07-17
2025-11-14 17:22:33,990 - INFO - Finished converting document 8-K_2025-07-17 in 0.06 sec.
2025-11-14 17:22:34,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:34,024 - INFO - Going to convert document batch...
2025-11-14 17:22:34,025 - INFO - Processing document 8-K_2025-10-21
2025-11-14 17:22:34,038 - INFO - Finished converting document 8-K_2025-10-21 in 0.03 sec.
2025-11-14 17:22:34,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NFLX\8-K_2025-06-06' --> 'data\processed_data\NFLX\8-K_2025-06-06.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-06-24' --> 'data\processed_data\NFLX\8-K_2025-06-24.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-07-17' --> 'data\processed_data\NFLX\8-K_2025-07-17.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-10-21' --> 'data\processed_data\NFLX\8-K_2025-10-21.md'


2025-11-14 17:22:34,067 - INFO - Going to convert document batch...
2025-11-14 17:22:34,068 - INFO - Processing document 8-K_2025-10-30
2025-11-14 17:22:34,081 - INFO - Finished converting document 8-K_2025-10-30 in 0.03 sec.
2025-11-14 17:22:34,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:34,116 - INFO - Going to convert document batch...
2025-11-14 17:22:34,117 - INFO - Processing document 8-K_2025-11-04
2025-11-14 17:22:34,140 - INFO - Finished converting document 8-K_2025-11-04 in 0.05 sec.
2025-11-14 17:22:34,240 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:22:34,241 - ERROR - Input document DEF-14A_2023-04-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\NFLX\8-K_2025-10-30' --> 'data\processed_data\NFLX\8-K_2025-10-30.md'
Converted 'data\edgar_documents\NFLX\8-K_2025-11-04' --> 'data\processed_data\NFLX\8-K_2025-11-04.md'
Error processing data\edgar_documents\NFLX\DEF-14A_2023-04-21: File format not allowed: data\edgar_documents\NFLX\DEF-14A_2023-04-21


2025-11-14 17:22:34,306 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:22:34,307 - ERROR - Input document DEF-14A_2024-04-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:22:34,310 - INFO - Going to convert document batch...
2025-11-14 17:22:34,346 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:22:34,347 - ERROR - Input document DEF-14A_2025-04-17 with format No

Error processing data\edgar_documents\NFLX\DEF-14A_2024-04-18: File format not allowed: data\edgar_documents\NFLX\DEF-14A_2024-04-18
Error processing data\edgar_documents\NFLX\DEF-14A_2025-04-17: File format not allowed: data\edgar_documents\NFLX\DEF-14A_2025-04-17
Processed 151 new files. Errors: 6
Found 105 files to process in data\edgar_documents\NKE


2025-11-14 17:22:35,173 - INFO - Going to convert document batch...
2025-11-14 17:22:35,174 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:22:35,175 - INFO - Processing document 10-K_2023-07-20
2025-11-14 17:22:36,587 - INFO - Finished converting document 10-K_2023-07-20 in 2.22 sec.
2025-11-14 17:22:37,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-K_2023-07-20' --> 'data\processed_data\NKE\10-K_2023-07-20.md'


2025-11-14 17:22:37,839 - INFO - Going to convert document batch...
2025-11-14 17:22:37,840 - INFO - Processing document 10-K_2024-07-25
2025-11-14 17:22:39,102 - INFO - Finished converting document 10-K_2024-07-25 in 2.03 sec.
2025-11-14 17:22:39,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-K_2024-07-25' --> 'data\processed_data\NKE\10-K_2024-07-25.md'


2025-11-14 17:22:40,485 - INFO - Going to convert document batch...
2025-11-14 17:22:40,486 - INFO - Processing document 10-K_2025-07-17
2025-11-14 17:22:41,896 - INFO - Finished converting document 10-K_2025-07-17 in 2.31 sec.
2025-11-14 17:22:42,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-K_2025-07-17' --> 'data\processed_data\NKE\10-K_2025-07-17.md'


2025-11-14 17:22:42,902 - INFO - Going to convert document batch...
2025-11-14 17:22:42,903 - INFO - Processing document 10-Q_2023-01-05
2025-11-14 17:22:43,745 - INFO - Finished converting document 10-Q_2023-01-05 in 1.36 sec.
2025-11-14 17:22:44,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2023-01-05' --> 'data\processed_data\NKE\10-Q_2023-01-05.md'


2025-11-14 17:22:45,047 - INFO - Going to convert document batch...
2025-11-14 17:22:45,048 - INFO - Processing document 10-Q_2023-04-06
2025-11-14 17:22:45,883 - INFO - Finished converting document 10-Q_2023-04-06 in 1.75 sec.
2025-11-14 17:22:46,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2023-04-06' --> 'data\processed_data\NKE\10-Q_2023-04-06.md'


2025-11-14 17:22:46,609 - INFO - Going to convert document batch...
2025-11-14 17:22:46,610 - INFO - Processing document 10-Q_2023-10-06
2025-11-14 17:22:47,178 - INFO - Finished converting document 10-Q_2023-10-06 in 0.89 sec.
2025-11-14 17:22:47,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2023-10-06' --> 'data\processed_data\NKE\10-Q_2023-10-06.md'


2025-11-14 17:22:48,263 - INFO - Going to convert document batch...
2025-11-14 17:22:48,264 - INFO - Processing document 10-Q_2024-01-05
2025-11-14 17:22:49,049 - INFO - Finished converting document 10-Q_2024-01-05 in 1.59 sec.
2025-11-14 17:22:49,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2024-01-05' --> 'data\processed_data\NKE\10-Q_2024-01-05.md'


2025-11-14 17:22:50,177 - INFO - Going to convert document batch...
2025-11-14 17:22:50,178 - INFO - Processing document 10-Q_2024-04-04
2025-11-14 17:22:50,974 - INFO - Finished converting document 10-Q_2024-04-04 in 1.56 sec.
2025-11-14 17:22:51,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2024-04-04' --> 'data\processed_data\NKE\10-Q_2024-04-04.md'


2025-11-14 17:22:51,655 - INFO - Going to convert document batch...
2025-11-14 17:22:51,656 - INFO - Processing document 10-Q_2024-10-07
2025-11-14 17:22:52,209 - INFO - Finished converting document 10-Q_2024-10-07 in 0.86 sec.
2025-11-14 17:22:52,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2024-10-07' --> 'data\processed_data\NKE\10-Q_2024-10-07.md'


2025-11-14 17:22:53,287 - INFO - Going to convert document batch...
2025-11-14 17:22:53,288 - INFO - Processing document 10-Q_2025-01-03
2025-11-14 17:22:54,036 - INFO - Finished converting document 10-Q_2025-01-03 in 1.55 sec.
2025-11-14 17:22:54,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2025-01-03' --> 'data\processed_data\NKE\10-Q_2025-01-03.md'


2025-11-14 17:22:54,830 - INFO - Going to convert document batch...
2025-11-14 17:22:54,831 - INFO - Processing document 10-Q_2025-04-03
2025-11-14 17:22:55,877 - INFO - Finished converting document 10-Q_2025-04-03 in 1.52 sec.
2025-11-14 17:22:56,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2025-04-03' --> 'data\processed_data\NKE\10-Q_2025-04-03.md'


2025-11-14 17:22:56,642 - INFO - Going to convert document batch...
2025-11-14 17:22:56,642 - INFO - Processing document 10-Q_2025-10-01
2025-11-14 17:22:57,237 - INFO - Finished converting document 10-Q_2025-10-01 in 0.97 sec.
2025-11-14 17:22:57,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:57,561 - INFO - Going to convert document batch...
2025-11-14 17:22:57,562 - INFO - Processing document 4_2023-01-09
2025-11-14 17:22:57,588 - INFO - Finished converting document 4_2023-01-09 in 0.05 sec.
2025-11-14 17:22:57,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:57,653 - INFO - Going to convert document batch...
2025-11-14 17:22:57,654 - INFO - Processing document 4_2023-01-18
2025-11-14 17:22:57,673 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:22:57,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\10-Q_2025-10-01' --> 'data\processed_data\NKE\10-Q_2025-10-01.md'
Converted 'data\edgar_documents\NKE\4_2023-01-09' --> 'data\processed_data\NKE\4_2023-01-09.md'
Converted 'data\edgar_documents\NKE\4_2023-01-18' --> 'data\processed_data\NKE\4_2023-01-18.md'


2025-11-14 17:22:57,731 - INFO - Going to convert document batch...
2025-11-14 17:22:57,732 - INFO - Processing document 4_2023-02-08
2025-11-14 17:22:57,750 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.
2025-11-14 17:22:57,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:57,789 - INFO - Going to convert document batch...
2025-11-14 17:22:57,790 - INFO - Processing document 4_2023-02-14
2025-11-14 17:22:57,808 - INFO - Finished converting document 4_2023-02-14 in 0.05 sec.
2025-11-14 17:22:57,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:57,852 - INFO - Going to convert document batch...
2025-11-14 17:22:57,853 - INFO - Processing document 4_2023-04-10
2025-11-14 17:22:57,883 - INFO - Finished converting document 4_2023-04-10 in 0.05 sec.
2025-11-14 17:22:57,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:57,938 - INFO - Going to convert document batch...
2025-11-14 17:22:57,938 - 

Converted 'data\edgar_documents\NKE\4_2023-02-08' --> 'data\processed_data\NKE\4_2023-02-08.md'
Converted 'data\edgar_documents\NKE\4_2023-02-14' --> 'data\processed_data\NKE\4_2023-02-14.md'
Converted 'data\edgar_documents\NKE\4_2023-04-10' --> 'data\processed_data\NKE\4_2023-04-10.md'


2025-11-14 17:22:57,961 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.
2025-11-14 17:22:58,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,011 - INFO - Going to convert document batch...
2025-11-14 17:22:58,013 - INFO - Processing document 4_2023-05-15
2025-11-14 17:22:58,042 - INFO - Finished converting document 4_2023-05-15 in 0.06 sec.
2025-11-14 17:22:58,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,109 - INFO - Going to convert document batch...
2025-11-14 17:22:58,111 - INFO - Processing document 4_2023-06-05
2025-11-14 17:22:58,140 - INFO - Finished converting document 4_2023-06-05 in 0.06 sec.


Converted 'data\edgar_documents\NKE\4_2023-04-18' --> 'data\processed_data\NKE\4_2023-04-18.md'
Converted 'data\edgar_documents\NKE\4_2023-05-15' --> 'data\processed_data\NKE\4_2023-05-15.md'


2025-11-14 17:22:58,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,186 - INFO - Going to convert document batch...
2025-11-14 17:22:58,187 - INFO - Processing document 4_2023-06-07
2025-11-14 17:22:58,207 - INFO - Finished converting document 4_2023-06-07 in 0.03 sec.
2025-11-14 17:22:58,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,259 - INFO - Going to convert document batch...
2025-11-14 17:22:58,260 - INFO - Processing document 4_2023-07-14
2025-11-14 17:22:58,283 - INFO - Finished converting document 4_2023-07-14 in 0.05 sec.
2025-11-14 17:22:58,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,353 - INFO - Going to convert document batch...
2025-11-14 17:22:58,353 - INFO - Processing document 4_2023-07-17


Converted 'data\edgar_documents\NKE\4_2023-06-05' --> 'data\processed_data\NKE\4_2023-06-05.md'
Converted 'data\edgar_documents\NKE\4_2023-06-07' --> 'data\processed_data\NKE\4_2023-06-07.md'
Converted 'data\edgar_documents\NKE\4_2023-07-14' --> 'data\processed_data\NKE\4_2023-07-14.md'


2025-11-14 17:22:58,370 - INFO - Finished converting document 4_2023-07-17 in 0.06 sec.
2025-11-14 17:22:58,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,417 - INFO - Going to convert document batch...
2025-11-14 17:22:58,418 - INFO - Processing document 4_2023-07-19
2025-11-14 17:22:58,453 - INFO - Finished converting document 4_2023-07-19 in 0.06 sec.
2025-11-14 17:22:58,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,519 - INFO - Going to convert document batch...
2025-11-14 17:22:58,521 - INFO - Processing document 4_2023-08-03
2025-11-14 17:22:58,563 - INFO - Finished converting document 4_2023-08-03 in 0.08 sec.


Converted 'data\edgar_documents\NKE\4_2023-07-17' --> 'data\processed_data\NKE\4_2023-07-17.md'
Converted 'data\edgar_documents\NKE\4_2023-07-19' --> 'data\processed_data\NKE\4_2023-07-19.md'
Converted 'data\edgar_documents\NKE\4_2023-08-03' --> 'data\processed_data\NKE\4_2023-08-03.md'


2025-11-14 17:22:58,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,638 - INFO - Going to convert document batch...
2025-11-14 17:22:58,639 - INFO - Processing document 4_2023-08-07
2025-11-14 17:22:58,666 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 17:22:58,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,749 - INFO - Going to convert document batch...
2025-11-14 17:22:58,750 - INFO - Processing document 4_2023-08-09
2025-11-14 17:22:58,802 - INFO - Finished converting document 4_2023-08-09 in 0.09 sec.
2025-11-14 17:22:58,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,871 - INFO - Going to convert document batch...
2025-11-14 17:22:58,872 - INFO - Processing document 4_2023-08-22
2025-11-14 17:22:58,909 - INFO - Finished converting document 4_2023-08-22 in 0.06 sec.


Converted 'data\edgar_documents\NKE\4_2023-08-07' --> 'data\processed_data\NKE\4_2023-08-07.md'
Converted 'data\edgar_documents\NKE\4_2023-08-09' --> 'data\processed_data\NKE\4_2023-08-09.md'


2025-11-14 17:22:58,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:58,969 - INFO - Going to convert document batch...
2025-11-14 17:22:58,970 - INFO - Processing document 4_2023-09-12
2025-11-14 17:22:58,990 - INFO - Finished converting document 4_2023-09-12 in 0.05 sec.
2025-11-14 17:22:59,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,036 - INFO - Going to convert document batch...
2025-11-14 17:22:59,037 - INFO - Processing document 4_2023-09-14
2025-11-14 17:22:59,056 - INFO - Finished converting document 4_2023-09-14 in 0.03 sec.
2025-11-14 17:22:59,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,097 - INFO - Going to convert document batch...
2025-11-14 17:22:59,098 - INFO - Processing document 4_2023-10-03
2025-11-14 17:22:59,118 - INFO - Finished converting document 4_2023-10-03 in 0.03 sec.


Converted 'data\edgar_documents\NKE\4_2023-08-22' --> 'data\processed_data\NKE\4_2023-08-22.md'
Converted 'data\edgar_documents\NKE\4_2023-09-12' --> 'data\processed_data\NKE\4_2023-09-12.md'
Converted 'data\edgar_documents\NKE\4_2023-09-14' --> 'data\processed_data\NKE\4_2023-09-14.md'


2025-11-14 17:22:59,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,160 - INFO - Going to convert document batch...
2025-11-14 17:22:59,161 - INFO - Processing document 4_2023-10-13
2025-11-14 17:22:59,185 - INFO - Finished converting document 4_2023-10-13 in 0.05 sec.
2025-11-14 17:22:59,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,234 - INFO - Going to convert document batch...
2025-11-14 17:22:59,235 - INFO - Processing document 4_2023-10-17
2025-11-14 17:22:59,266 - INFO - Finished converting document 4_2023-10-17 in 0.06 sec.
2025-11-14 17:22:59,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,310 - INFO - Going to convert document batch...
2025-11-14 17:22:59,310 - INFO - Processing document 4_2023-12-13
2025-11-14 17:22:59,335 - INFO - Finished converting document 4_2023-12-13 in 0.05 sec.


Converted 'data\edgar_documents\NKE\4_2023-10-03' --> 'data\processed_data\NKE\4_2023-10-03.md'
Converted 'data\edgar_documents\NKE\4_2023-10-13' --> 'data\processed_data\NKE\4_2023-10-13.md'
Converted 'data\edgar_documents\NKE\4_2023-10-17' --> 'data\processed_data\NKE\4_2023-10-17.md'


2025-11-14 17:22:59,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,380 - INFO - Going to convert document batch...
2025-11-14 17:22:59,381 - INFO - Processing document 4_2024-01-12
2025-11-14 17:22:59,399 - INFO - Finished converting document 4_2024-01-12 in 0.03 sec.
2025-11-14 17:22:59,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,444 - INFO - Going to convert document batch...
2025-11-14 17:22:59,445 - INFO - Processing document 4_2024-02-13
2025-11-14 17:22:59,467 - INFO - Finished converting document 4_2024-02-13 in 0.05 sec.
2025-11-14 17:22:59,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,514 - INFO - Going to convert document batch...
2025-11-14 17:22:59,515 - INFO - Processing document 4_2024-02-16
2025-11-14 17:22:59,542 - INFO - Finished converting document 4_2024-02-16 in 0.06 sec.


Converted 'data\edgar_documents\NKE\4_2023-12-13' --> 'data\processed_data\NKE\4_2023-12-13.md'
Converted 'data\edgar_documents\NKE\4_2024-01-12' --> 'data\processed_data\NKE\4_2024-01-12.md'
Converted 'data\edgar_documents\NKE\4_2024-02-13' --> 'data\processed_data\NKE\4_2024-02-13.md'


2025-11-14 17:22:59,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,590 - INFO - Going to convert document batch...
2025-11-14 17:22:59,591 - INFO - Processing document 4_2024-05-08
2025-11-14 17:22:59,625 - INFO - Finished converting document 4_2024-05-08 in 0.06 sec.
2025-11-14 17:22:59,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,682 - INFO - Going to convert document batch...
2025-11-14 17:22:59,683 - INFO - Processing document 4_2024-05-10
2025-11-14 17:22:59,704 - INFO - Finished converting document 4_2024-05-10 in 0.05 sec.
2025-11-14 17:22:59,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,749 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NKE\4_2024-02-16' --> 'data\processed_data\NKE\4_2024-02-16.md'
Converted 'data\edgar_documents\NKE\4_2024-05-08' --> 'data\processed_data\NKE\4_2024-05-08.md'
Converted 'data\edgar_documents\NKE\4_2024-05-10' --> 'data\processed_data\NKE\4_2024-05-10.md'


2025-11-14 17:22:59,749 - INFO - Processing document 4_2024-05-15
2025-11-14 17:22:59,780 - INFO - Finished converting document 4_2024-05-15 in 0.06 sec.
2025-11-14 17:22:59,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,830 - INFO - Going to convert document batch...
2025-11-14 17:22:59,831 - INFO - Processing document 4_2024-06-05
2025-11-14 17:22:59,848 - INFO - Finished converting document 4_2024-06-05 in 0.03 sec.
2025-11-14 17:22:59,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,896 - INFO - Going to convert document batch...
2025-11-14 17:22:59,898 - INFO - Processing document 4_2024-06-07
2025-11-14 17:22:59,916 - INFO - Finished converting document 4_2024-06-07 in 0.05 sec.
2025-11-14 17:22:59,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:22:59,968 - INFO - Going to convert document batch...
2025-11-14 17:22:59,969 - INFO - Processing document 4_2024-07-01
2025-11-14 17:23:00,416 - IN

Converted 'data\edgar_documents\NKE\4_2024-05-15' --> 'data\processed_data\NKE\4_2024-05-15.md'
Converted 'data\edgar_documents\NKE\4_2024-06-05' --> 'data\processed_data\NKE\4_2024-06-05.md'
Converted 'data\edgar_documents\NKE\4_2024-06-07' --> 'data\processed_data\NKE\4_2024-06-07.md'


2025-11-14 17:23:00,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,482 - INFO - Going to convert document batch...
2025-11-14 17:23:00,483 - INFO - Processing document 4_2024-07-11
2025-11-14 17:23:00,506 - INFO - Finished converting document 4_2024-07-11 in 0.06 sec.
2025-11-14 17:23:00,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,559 - INFO - Going to convert document batch...
2025-11-14 17:23:00,559 - INFO - Processing document 4_2024-07-12
2025-11-14 17:23:00,582 - INFO - Finished converting document 4_2024-07-12 in 0.05 sec.
2025-11-14 17:23:00,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\4_2024-07-01' --> 'data\processed_data\NKE\4_2024-07-01.md'
Converted 'data\edgar_documents\NKE\4_2024-07-11' --> 'data\processed_data\NKE\4_2024-07-11.md'
Converted 'data\edgar_documents\NKE\4_2024-07-12' --> 'data\processed_data\NKE\4_2024-07-12.md'


2025-11-14 17:23:00,641 - INFO - Going to convert document batch...
2025-11-14 17:23:00,643 - INFO - Processing document 4_2024-07-22
2025-11-14 17:23:00,667 - INFO - Finished converting document 4_2024-07-22 in 0.08 sec.
2025-11-14 17:23:00,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,733 - INFO - Going to convert document batch...
2025-11-14 17:23:00,735 - INFO - Processing document 4_2024-08-05
2025-11-14 17:23:00,763 - INFO - Finished converting document 4_2024-08-05 in 0.08 sec.
2025-11-14 17:23:00,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,803 - INFO - Going to convert document batch...
2025-11-14 17:23:00,804 - INFO - Processing document 4_2024-08-08
2025-11-14 17:23:00,822 - INFO - Finished converting document 4_2024-08-08 in 0.03 sec.
2025-11-14 17:23:00,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,863 - INFO - Going to convert document batch...
2025-11-14 17:23:00,863 - 

Converted 'data\edgar_documents\NKE\4_2024-07-22' --> 'data\processed_data\NKE\4_2024-07-22.md'
Converted 'data\edgar_documents\NKE\4_2024-08-05' --> 'data\processed_data\NKE\4_2024-08-05.md'
Converted 'data\edgar_documents\NKE\4_2024-08-08' --> 'data\processed_data\NKE\4_2024-08-08.md'


2025-11-14 17:23:00,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,928 - INFO - Going to convert document batch...
2025-11-14 17:23:00,930 - INFO - Processing document 4_2024-09-04
2025-11-14 17:23:00,950 - INFO - Finished converting document 4_2024-09-04 in 0.05 sec.
2025-11-14 17:23:00,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:00,995 - INFO - Going to convert document batch...
2025-11-14 17:23:00,996 - INFO - Processing document 4_2024-09-11
2025-11-14 17:23:01,039 - INFO - Finished converting document 4_2024-09-11 in 0.06 sec.
2025-11-14 17:23:01,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,087 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NKE\4_2024-08-15' --> 'data\processed_data\NKE\4_2024-08-15.md'
Converted 'data\edgar_documents\NKE\4_2024-09-04' --> 'data\processed_data\NKE\4_2024-09-04.md'
Converted 'data\edgar_documents\NKE\4_2024-09-11' --> 'data\processed_data\NKE\4_2024-09-11.md'


2025-11-14 17:23:01,088 - INFO - Processing document 4_2024-09-19
2025-11-14 17:23:01,108 - INFO - Finished converting document 4_2024-09-19 in 0.05 sec.
2025-11-14 17:23:01,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,153 - INFO - Going to convert document batch...
2025-11-14 17:23:01,154 - INFO - Processing document 4_2024-10-16
2025-11-14 17:23:01,177 - INFO - Finished converting document 4_2024-10-16 in 0.05 sec.
2025-11-14 17:23:01,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,218 - INFO - Going to convert document batch...
2025-11-14 17:23:01,219 - INFO - Processing document 4_2024-10-31
2025-11-14 17:23:01,239 - INFO - Finished converting document 4_2024-10-31 in 0.03 sec.
2025-11-14 17:23:01,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,280 - INFO - Going to convert document batch...
2025-11-14 17:23:01,281 - INFO - Processing document 4_2024-11-15
2025-11-14 17:23:01,303 - IN

Converted 'data\edgar_documents\NKE\4_2024-09-19' --> 'data\processed_data\NKE\4_2024-09-19.md'
Converted 'data\edgar_documents\NKE\4_2024-10-16' --> 'data\processed_data\NKE\4_2024-10-16.md'
Converted 'data\edgar_documents\NKE\4_2024-10-31' --> 'data\processed_data\NKE\4_2024-10-31.md'


2025-11-14 17:23:01,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,348 - INFO - Going to convert document batch...
2025-11-14 17:23:01,349 - INFO - Processing document 4_2024-11-27
2025-11-14 17:23:01,372 - INFO - Finished converting document 4_2024-11-27 in 0.05 sec.
2025-11-14 17:23:01,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,439 - INFO - Going to convert document batch...
2025-11-14 17:23:01,440 - INFO - Processing document 4_2024-12-30
2025-11-14 17:23:01,463 - INFO - Finished converting document 4_2024-12-30 in 0.08 sec.
2025-11-14 17:23:01,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\4_2024-11-15' --> 'data\processed_data\NKE\4_2024-11-15.md'
Converted 'data\edgar_documents\NKE\4_2024-11-27' --> 'data\processed_data\NKE\4_2024-11-27.md'
Converted 'data\edgar_documents\NKE\4_2024-12-30' --> 'data\processed_data\NKE\4_2024-12-30.md'


2025-11-14 17:23:01,537 - INFO - Going to convert document batch...
2025-11-14 17:23:01,538 - INFO - Processing document 4_2025-01-08
2025-11-14 17:23:01,563 - INFO - Finished converting document 4_2025-01-08 in 0.06 sec.
2025-11-14 17:23:01,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,631 - INFO - Going to convert document batch...
2025-11-14 17:23:01,633 - INFO - Processing document 4_2025-02-12
2025-11-14 17:23:01,672 - INFO - Finished converting document 4_2025-02-12 in 0.08 sec.
2025-11-14 17:23:01,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,719 - INFO - Going to convert document batch...
2025-11-14 17:23:01,720 - INFO - Processing document 4_2025-02-18
2025-11-14 17:23:01,748 - INFO - Finished converting document 4_2025-02-18 in 0.06 sec.
2025-11-14 17:23:01,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\4_2025-01-08' --> 'data\processed_data\NKE\4_2025-01-08.md'
Converted 'data\edgar_documents\NKE\4_2025-02-12' --> 'data\processed_data\NKE\4_2025-02-12.md'
Converted 'data\edgar_documents\NKE\4_2025-02-18' --> 'data\processed_data\NKE\4_2025-02-18.md'


2025-11-14 17:23:01,794 - INFO - Going to convert document batch...
2025-11-14 17:23:01,795 - INFO - Processing document 4_2025-04-07
2025-11-14 17:23:01,813 - INFO - Finished converting document 4_2025-04-07 in 0.05 sec.
2025-11-14 17:23:01,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,857 - INFO - Going to convert document batch...
2025-11-14 17:23:01,858 - INFO - Processing document 4_2025-04-25
2025-11-14 17:23:01,880 - INFO - Finished converting document 4_2025-04-25 in 0.05 sec.
2025-11-14 17:23:01,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:01,929 - INFO - Going to convert document batch...
2025-11-14 17:23:01,930 - INFO - Processing document 4_2025-05-15
2025-11-14 17:23:01,958 - INFO - Finished converting document 4_2025-05-15 in 0.05 sec.
2025-11-14 17:23:01,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,002 - INFO - Going to convert document batch...
2025-11-14 17:23:02,003 - 

Converted 'data\edgar_documents\NKE\4_2025-04-07' --> 'data\processed_data\NKE\4_2025-04-07.md'
Converted 'data\edgar_documents\NKE\4_2025-04-25' --> 'data\processed_data\NKE\4_2025-04-25.md'
Converted 'data\edgar_documents\NKE\4_2025-05-15' --> 'data\processed_data\NKE\4_2025-05-15.md'


2025-11-14 17:23:02,027 - INFO - Finished converting document 4_2025-07-11 in 0.05 sec.
2025-11-14 17:23:02,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,094 - INFO - Going to convert document batch...
2025-11-14 17:23:02,095 - INFO - Processing document 4_2025-07-17
2025-11-14 17:23:02,124 - INFO - Finished converting document 4_2025-07-17 in 0.06 sec.
2025-11-14 17:23:02,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,168 - INFO - Going to convert document batch...
2025-11-14 17:23:02,168 - INFO - Processing document 4_2025-08-04
2025-11-14 17:23:02,188 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.
2025-11-14 17:23:02,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,228 - INFO - Going to convert document batch...
2025-11-14 17:23:02,229 - INFO - Processing document 4_2025-08-06
2025-11-14 17:23:02,248 - INFO - Finished converting document 4_2025-08-06 in 0.05 sec.


Converted 'data\edgar_documents\NKE\4_2025-07-11' --> 'data\processed_data\NKE\4_2025-07-11.md'
Converted 'data\edgar_documents\NKE\4_2025-07-17' --> 'data\processed_data\NKE\4_2025-07-17.md'
Converted 'data\edgar_documents\NKE\4_2025-08-04' --> 'data\processed_data\NKE\4_2025-08-04.md'


2025-11-14 17:23:02,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,289 - INFO - Going to convert document batch...
2025-11-14 17:23:02,290 - INFO - Processing document 4_2025-08-14
2025-11-14 17:23:02,310 - INFO - Finished converting document 4_2025-08-14 in 0.05 sec.
2025-11-14 17:23:02,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,357 - INFO - Going to convert document batch...
2025-11-14 17:23:02,359 - INFO - Processing document 4_2025-08-18
2025-11-14 17:23:02,384 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 17:23:02,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,430 - INFO - Going to convert document batch...
2025-11-14 17:23:02,430 - INFO - Processing document 4_2025-09-03
2025-11-14 17:23:02,454 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.


Converted 'data\edgar_documents\NKE\4_2025-08-06' --> 'data\processed_data\NKE\4_2025-08-06.md'
Converted 'data\edgar_documents\NKE\4_2025-08-14' --> 'data\processed_data\NKE\4_2025-08-14.md'
Converted 'data\edgar_documents\NKE\4_2025-08-18' --> 'data\processed_data\NKE\4_2025-08-18.md'


2025-11-14 17:23:02,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,498 - INFO - Going to convert document batch...
2025-11-14 17:23:02,499 - INFO - Processing document 4_2025-09-08
2025-11-14 17:23:02,521 - INFO - Finished converting document 4_2025-09-08 in 0.05 sec.
2025-11-14 17:23:02,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,563 - INFO - Going to convert document batch...
2025-11-14 17:23:02,564 - INFO - Processing document 4_2025-09-11
2025-11-14 17:23:02,584 - INFO - Finished converting document 4_2025-09-11 in 0.03 sec.
2025-11-14 17:23:02,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,624 - INFO - Going to convert document batch...
2025-11-14 17:23:02,624 - INFO - Processing document 4_2025-10-03
2025-11-14 17:23:02,645 - INFO - Finished converting document 4_2025-10-03 in 0.03 sec.


Converted 'data\edgar_documents\NKE\4_2025-09-03' --> 'data\processed_data\NKE\4_2025-09-03.md'
Converted 'data\edgar_documents\NKE\4_2025-09-08' --> 'data\processed_data\NKE\4_2025-09-08.md'
Converted 'data\edgar_documents\NKE\4_2025-09-11' --> 'data\processed_data\NKE\4_2025-09-11.md'


2025-11-14 17:23:02,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,685 - INFO - Going to convert document batch...
2025-11-14 17:23:02,686 - INFO - Processing document 4_2025-10-07
2025-11-14 17:23:02,706 - INFO - Finished converting document 4_2025-10-07 in 0.03 sec.
2025-11-14 17:23:02,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,754 - INFO - Going to convert document batch...
2025-11-14 17:23:02,755 - INFO - Processing document 4_2025-10-16
2025-11-14 17:23:02,783 - INFO - Finished converting document 4_2025-10-16 in 0.05 sec.
2025-11-14 17:23:02,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\4_2025-10-03' --> 'data\processed_data\NKE\4_2025-10-03.md'
Converted 'data\edgar_documents\NKE\4_2025-10-07' --> 'data\processed_data\NKE\4_2025-10-07.md'
Converted 'data\edgar_documents\NKE\4_2025-10-16' --> 'data\processed_data\NKE\4_2025-10-16.md'


2025-11-14 17:23:02,862 - INFO - Going to convert document batch...
2025-11-14 17:23:02,863 - INFO - Processing document 4_2025-11-10
2025-11-14 17:23:02,881 - INFO - Finished converting document 4_2025-11-10 in 0.05 sec.
2025-11-14 17:23:02,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,931 - INFO - Going to convert document batch...
2025-11-14 17:23:02,932 - INFO - Processing document 8-K_2023-03-13
2025-11-14 17:23:02,955 - INFO - Finished converting document 8-K_2023-03-13 in 0.05 sec.
2025-11-14 17:23:02,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:02,989 - INFO - Going to convert document batch...
2025-11-14 17:23:02,990 - INFO - Processing document 8-K_2023-03-21
2025-11-14 17:23:03,004 - INFO - Finished converting document 8-K_2023-03-21 in 0.03 sec.
2025-11-14 17:23:03,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,039 - INFO - Going to convert document batch...
2025-11-14 17:23:0

Converted 'data\edgar_documents\NKE\4_2025-11-10' --> 'data\processed_data\NKE\4_2025-11-10.md'
Converted 'data\edgar_documents\NKE\8-K_2023-03-13' --> 'data\processed_data\NKE\8-K_2023-03-13.md'
Converted 'data\edgar_documents\NKE\8-K_2023-03-21' --> 'data\processed_data\NKE\8-K_2023-03-21.md'
Converted 'data\edgar_documents\NKE\8-K_2023-05-09' --> 'data\processed_data\NKE\8-K_2023-05-09.md'


2025-11-14 17:23:03,090 - INFO - Processing document 8-K_2023-05-24
2025-11-14 17:23:03,105 - INFO - Finished converting document 8-K_2023-05-24 in 0.05 sec.
2025-11-14 17:23:03,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,139 - INFO - Going to convert document batch...
2025-11-14 17:23:03,139 - INFO - Processing document 8-K_2023-06-29
2025-11-14 17:23:03,157 - INFO - Finished converting document 8-K_2023-06-29 in 0.05 sec.
2025-11-14 17:23:03,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,207 - INFO - Going to convert document batch...
2025-11-14 17:23:03,208 - INFO - Processing document 8-K_2023-09-15
2025-11-14 17:23:03,247 - INFO - Finished converting document 8-K_2023-09-15 in 0.08 sec.
2025-11-14 17:23:03,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,290 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NKE\8-K_2023-05-24' --> 'data\processed_data\NKE\8-K_2023-05-24.md'
Converted 'data\edgar_documents\NKE\8-K_2023-06-29' --> 'data\processed_data\NKE\8-K_2023-06-29.md'
Converted 'data\edgar_documents\NKE\8-K_2023-09-15' --> 'data\processed_data\NKE\8-K_2023-09-15.md'


2025-11-14 17:23:03,291 - INFO - Processing document 8-K_2023-09-28
2025-11-14 17:23:03,309 - INFO - Finished converting document 8-K_2023-09-28 in 0.05 sec.
2025-11-14 17:23:03,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,354 - INFO - Going to convert document batch...
2025-11-14 17:23:03,356 - INFO - Processing document 8-K_2023-12-21
2025-11-14 17:23:03,392 - INFO - Finished converting document 8-K_2023-12-21 in 0.08 sec.
2025-11-14 17:23:03,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,437 - INFO - Going to convert document batch...
2025-11-14 17:23:03,438 - INFO - Processing document 8-K_2024-03-11
2025-11-14 17:23:03,461 - INFO - Finished converting document 8-K_2024-03-11 in 0.05 sec.
2025-11-14 17:23:03,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,498 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NKE\8-K_2023-09-28' --> 'data\processed_data\NKE\8-K_2023-09-28.md'
Converted 'data\edgar_documents\NKE\8-K_2023-12-21' --> 'data\processed_data\NKE\8-K_2023-12-21.md'
Converted 'data\edgar_documents\NKE\8-K_2024-03-11' --> 'data\processed_data\NKE\8-K_2024-03-11.md'


2025-11-14 17:23:03,499 - INFO - Processing document 8-K_2024-03-21
2025-11-14 17:23:03,516 - INFO - Finished converting document 8-K_2024-03-21 in 0.05 sec.
2025-11-14 17:23:03,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,548 - INFO - Going to convert document batch...
2025-11-14 17:23:03,550 - INFO - Processing document 8-K_2024-06-05
2025-11-14 17:23:03,564 - INFO - Finished converting document 8-K_2024-06-05 in 0.05 sec.
2025-11-14 17:23:03,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,594 - INFO - Going to convert document batch...
2025-11-14 17:23:03,595 - INFO - Processing document 8-K_2024-06-27
2025-11-14 17:23:03,611 - INFO - Finished converting document 8-K_2024-06-27 in 0.03 sec.
2025-11-14 17:23:03,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,653 - INFO - Going to convert document batch...
2025-11-14 17:23:03,654 - INFO - Processing document 8-K_2024-09-13
2025-11-14 17:

Converted 'data\edgar_documents\NKE\8-K_2024-03-21' --> 'data\processed_data\NKE\8-K_2024-03-21.md'
Converted 'data\edgar_documents\NKE\8-K_2024-06-05' --> 'data\processed_data\NKE\8-K_2024-06-05.md'
Converted 'data\edgar_documents\NKE\8-K_2024-06-27' --> 'data\processed_data\NKE\8-K_2024-06-27.md'


2025-11-14 17:23:03,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,738 - INFO - Going to convert document batch...
2025-11-14 17:23:03,739 - INFO - Processing document 8-K_2024-09-19
2025-11-14 17:23:03,761 - INFO - Finished converting document 8-K_2024-09-19 in 0.05 sec.
2025-11-14 17:23:03,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,795 - INFO - Going to convert document batch...
2025-11-14 17:23:03,796 - INFO - Processing document 8-K_2024-09-20
2025-11-14 17:23:03,813 - INFO - Finished converting document 8-K_2024-09-20 in 0.05 sec.
2025-11-14 17:23:03,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,843 - INFO - Going to convert document batch...
2025-11-14 17:23:03,844 - INFO - Processing document 8-K_2024-10-01
2025-11-14 17:23:03,861 - INFO - Finished converting document 8-K_2024-10-01 in 0.03 sec.
2025-11-14 17:23:03,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\NKE\8-K_2024-09-13' --> 'data\processed_data\NKE\8-K_2024-09-13.md'
Converted 'data\edgar_documents\NKE\8-K_2024-09-19' --> 'data\processed_data\NKE\8-K_2024-09-19.md'
Converted 'data\edgar_documents\NKE\8-K_2024-09-20' --> 'data\processed_data\NKE\8-K_2024-09-20.md'
Converted 'data\edgar_documents\NKE\8-K_2024-10-01' --> 'data\processed_data\NKE\8-K_2024-10-01.md'


2025-11-14 17:23:03,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:03,943 - INFO - Going to convert document batch...
2025-11-14 17:23:03,945 - INFO - Processing document 8-K_2025-03-10
2025-11-14 17:23:03,969 - INFO - Finished converting document 8-K_2025-03-10 in 0.05 sec.
2025-11-14 17:23:03,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,013 - INFO - Going to convert document batch...
2025-11-14 17:23:04,014 - INFO - Processing document 8-K_2025-03-20
2025-11-14 17:23:04,038 - INFO - Finished converting document 8-K_2025-03-20 in 0.05 sec.
2025-11-14 17:23:04,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,092 - INFO - Going to convert document batch...
2025-11-14 17:23:04,094 - INFO - Processing document 8-K_2025-05-05
2025-11-14 17:23:04,111 - INFO - Finished converting document 8-K_2025-05-05 in 0.06 sec.


Converted 'data\edgar_documents\NKE\8-K_2024-12-19' --> 'data\processed_data\NKE\8-K_2024-12-19.md'
Converted 'data\edgar_documents\NKE\8-K_2025-03-10' --> 'data\processed_data\NKE\8-K_2025-03-10.md'
Converted 'data\edgar_documents\NKE\8-K_2025-03-20' --> 'data\processed_data\NKE\8-K_2025-03-20.md'


2025-11-14 17:23:04,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,160 - INFO - Going to convert document batch...
2025-11-14 17:23:04,161 - INFO - Processing document 8-K_2025-06-18
2025-11-14 17:23:04,174 - INFO - Finished converting document 8-K_2025-06-18 in 0.05 sec.
2025-11-14 17:23:04,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,205 - INFO - Going to convert document batch...
2025-11-14 17:23:04,205 - INFO - Processing document 8-K_2025-06-25
2025-11-14 17:23:04,222 - INFO - Finished converting document 8-K_2025-06-25 in 0.03 sec.
2025-11-14 17:23:04,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,255 - INFO - Going to convert document batch...
2025-11-14 17:23:04,256 - INFO - Processing document 8-K_2025-06-26
2025-11-14 17:23:04,272 - INFO - Finished converting document 8-K_2025-06-26 in 0.03 sec.
2025-11-14 17:23:04,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\NKE\8-K_2025-05-05' --> 'data\processed_data\NKE\8-K_2025-05-05.md'
Converted 'data\edgar_documents\NKE\8-K_2025-06-18' --> 'data\processed_data\NKE\8-K_2025-06-18.md'
Converted 'data\edgar_documents\NKE\8-K_2025-06-25' --> 'data\processed_data\NKE\8-K_2025-06-25.md'
Converted 'data\edgar_documents\NKE\8-K_2025-06-26' --> 'data\processed_data\NKE\8-K_2025-06-26.md'


2025-11-14 17:23:04,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,356 - INFO - Going to convert document batch...
2025-11-14 17:23:04,357 - INFO - Processing document 8-K_2025-09-11
2025-11-14 17:23:04,402 - INFO - Finished converting document 8-K_2025-09-11 in 0.08 sec.
2025-11-14 17:23:04,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:04,459 - INFO - Going to convert document batch...
2025-11-14 17:23:04,460 - INFO - Processing document 8-K_2025-09-30
2025-11-14 17:23:04,476 - INFO - Finished converting document 8-K_2025-09-30 in 0.05 sec.
2025-11-14 17:23:04,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\8-K_2025-07-28' --> 'data\processed_data\NKE\8-K_2025-07-28.md'
Converted 'data\edgar_documents\NKE\8-K_2025-09-11' --> 'data\processed_data\NKE\8-K_2025-09-11.md'
Converted 'data\edgar_documents\NKE\8-K_2025-09-30' --> 'data\processed_data\NKE\8-K_2025-09-30.md'


2025-11-14 17:23:04,999 - INFO - Going to convert document batch...
2025-11-14 17:23:05,000 - INFO - Processing document DEF-14A_2023-07-20
2025-11-14 17:23:06,195 - INFO - Finished converting document DEF-14A_2023-07-20 in 1.70 sec.
2025-11-14 17:23:06,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\DEF-14A_2023-07-20' --> 'data\processed_data\NKE\DEF-14A_2023-07-20.md'


2025-11-14 17:23:07,085 - INFO - Going to convert document batch...
2025-11-14 17:23:07,086 - INFO - Processing document DEF-14A_2024-07-25
2025-11-14 17:23:08,571 - INFO - Finished converting document DEF-14A_2024-07-25 in 1.75 sec.
2025-11-14 17:23:09,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\DEF-14A_2024-07-25' --> 'data\processed_data\NKE\DEF-14A_2024-07-25.md'


2025-11-14 17:23:09,483 - INFO - Going to convert document batch...
2025-11-14 17:23:09,484 - INFO - Processing document DEF-14A_2025-07-17
2025-11-14 17:23:10,886 - INFO - Finished converting document DEF-14A_2025-07-17 in 1.77 sec.
2025-11-14 17:23:11,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NKE\DEF-14A_2025-07-17' --> 'data\processed_data\NKE\DEF-14A_2025-07-17.md'
Processed 105 new files. Errors: 0
Found 162 files to process in data\edgar_documents\NOW


2025-11-14 17:23:12,456 - INFO - Going to convert document batch...
2025-11-14 17:23:12,457 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:23:12,457 - INFO - Processing document 10-K_2023-01-31
2025-11-14 17:23:13,921 - INFO - Finished converting document 10-K_2023-01-31 in 2.27 sec.
2025-11-14 17:23:14,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-K_2023-01-31' --> 'data\processed_data\NOW\10-K_2023-01-31.md'


2025-11-14 17:23:14,790 - INFO - Going to convert document batch...
2025-11-14 17:23:14,791 - INFO - Processing document 10-K_2024-01-25
2025-11-14 17:23:16,367 - INFO - Finished converting document 10-K_2024-01-25 in 2.01 sec.
2025-11-14 17:23:16,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-K_2024-01-25' --> 'data\processed_data\NOW\10-K_2024-01-25.md'


2025-11-14 17:23:17,259 - INFO - Going to convert document batch...
2025-11-14 17:23:17,260 - INFO - Processing document 10-K_2025-01-30
2025-11-14 17:23:18,712 - INFO - Finished converting document 10-K_2025-01-30 in 1.92 sec.
2025-11-14 17:23:19,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-K_2025-01-30' --> 'data\processed_data\NOW\10-K_2025-01-30.md'


2025-11-14 17:23:19,445 - INFO - Going to convert document batch...
2025-11-14 17:23:19,446 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:23:20,326 - INFO - Finished converting document 10-Q_2023-04-27 in 1.17 sec.
2025-11-14 17:23:20,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2023-04-27' --> 'data\processed_data\NOW\10-Q_2023-04-27.md'


2025-11-14 17:23:20,928 - INFO - Going to convert document batch...
2025-11-14 17:23:20,929 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:23:21,514 - INFO - Finished converting document 10-Q_2023-07-27 in 0.92 sec.
2025-11-14 17:23:21,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2023-07-27' --> 'data\processed_data\NOW\10-Q_2023-07-27.md'


2025-11-14 17:23:22,157 - INFO - Going to convert document batch...
2025-11-14 17:23:22,157 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:23:22,802 - INFO - Finished converting document 10-Q_2023-10-26 in 0.98 sec.
2025-11-14 17:23:23,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2023-10-26' --> 'data\processed_data\NOW\10-Q_2023-10-26.md'


2025-11-14 17:23:23,759 - INFO - Going to convert document batch...
2025-11-14 17:23:23,760 - INFO - Processing document 10-Q_2024-05-06
2025-11-14 17:23:24,327 - INFO - Finished converting document 10-Q_2024-05-06 in 0.86 sec.
2025-11-14 17:23:24,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2024-05-06' --> 'data\processed_data\NOW\10-Q_2024-05-06.md'


2025-11-14 17:23:24,932 - INFO - Going to convert document batch...
2025-11-14 17:23:24,933 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:23:25,537 - INFO - Finished converting document 10-Q_2024-07-25 in 0.94 sec.
2025-11-14 17:23:26,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2024-07-25' --> 'data\processed_data\NOW\10-Q_2024-07-25.md'


2025-11-14 17:23:26,481 - INFO - Going to convert document batch...
2025-11-14 17:23:26,482 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 17:23:27,124 - INFO - Finished converting document 10-Q_2024-10-24 in 0.98 sec.
2025-11-14 17:23:27,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2024-10-24' --> 'data\processed_data\NOW\10-Q_2024-10-24.md'


2025-11-14 17:23:27,766 - INFO - Going to convert document batch...
2025-11-14 17:23:27,767 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 17:23:28,603 - INFO - Finished converting document 10-Q_2025-04-23 in 1.14 sec.
2025-11-14 17:23:28,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2025-04-23' --> 'data\processed_data\NOW\10-Q_2025-04-23.md'


2025-11-14 17:23:29,240 - INFO - Going to convert document batch...
2025-11-14 17:23:29,240 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 17:23:29,857 - INFO - Finished converting document 10-Q_2025-07-24 in 0.97 sec.
2025-11-14 17:23:30,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\10-Q_2025-07-24' --> 'data\processed_data\NOW\10-Q_2025-07-24.md'


2025-11-14 17:23:30,507 - INFO - Going to convert document batch...
2025-11-14 17:23:30,508 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 17:23:31,416 - INFO - Finished converting document 10-Q_2025-10-30 in 1.25 sec.
2025-11-14 17:23:31,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:31,756 - INFO - Going to convert document batch...
2025-11-14 17:23:31,757 - INFO - Processing document 4_2023-01-10
2025-11-14 17:23:31,777 - INFO - Finished converting document 4_2023-01-10 in 0.05 sec.
2025-11-14 17:23:31,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:31,844 - INFO - Going to convert document batch...
2025-11-14 17:23:31,845 - INFO - Processing document 4_2023-01-18
2025-11-14 17:23:31,865 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:23:31,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:31,904 - INFO - Going to convert document batch...
2025-11-14 17:23:31,

Converted 'data\edgar_documents\NOW\10-Q_2025-10-30' --> 'data\processed_data\NOW\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\NOW\4_2023-01-10' --> 'data\processed_data\NOW\4_2023-01-10.md'
Converted 'data\edgar_documents\NOW\4_2023-01-18' --> 'data\processed_data\NOW\4_2023-01-18.md'


2025-11-14 17:23:31,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:31,966 - INFO - Going to convert document batch...
2025-11-14 17:23:31,968 - INFO - Processing document 4_2023-01-31
2025-11-14 17:23:31,988 - INFO - Finished converting document 4_2023-01-31 in 0.05 sec.
2025-11-14 17:23:32,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,047 - INFO - Going to convert document batch...
2025-11-14 17:23:32,047 - INFO - Processing document 4_2023-02-03
2025-11-14 17:23:32,088 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.


Converted 'data\edgar_documents\NOW\4_2023-01-25' --> 'data\processed_data\NOW\4_2023-01-25.md'
Converted 'data\edgar_documents\NOW\4_2023-01-31' --> 'data\processed_data\NOW\4_2023-01-31.md'


2025-11-14 17:23:32,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,154 - INFO - Going to convert document batch...
2025-11-14 17:23:32,155 - INFO - Processing document 4_2023-02-09
2025-11-14 17:23:32,184 - INFO - Finished converting document 4_2023-02-09 in 0.06 sec.
2025-11-14 17:23:32,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,257 - INFO - Going to convert document batch...
2025-11-14 17:23:32,259 - INFO - Processing document 4_2023-02-14
2025-11-14 17:23:32,287 - INFO - Finished converting document 4_2023-02-14 in 0.06 sec.


Converted 'data\edgar_documents\NOW\4_2023-02-03' --> 'data\processed_data\NOW\4_2023-02-03.md'
Converted 'data\edgar_documents\NOW\4_2023-02-09' --> 'data\processed_data\NOW\4_2023-02-09.md'


2025-11-14 17:23:32,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,332 - INFO - Going to convert document batch...
2025-11-14 17:23:32,333 - INFO - Processing document 4_2023-02-17
2025-11-14 17:23:32,356 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 17:23:32,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,416 - INFO - Going to convert document batch...
2025-11-14 17:23:32,417 - INFO - Processing document 4_2023-02-22
2025-11-14 17:23:32,445 - INFO - Finished converting document 4_2023-02-22 in 0.06 sec.
2025-11-14 17:23:32,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,491 - INFO - Going to convert document batch...
2025-11-14 17:23:32,492 - INFO - Processing document 4_2023-02-28
2025-11-14 17:23:32,510 - INFO - Finished converting document 4_2023-02-28 in 0.03 sec.


Converted 'data\edgar_documents\NOW\4_2023-02-14' --> 'data\processed_data\NOW\4_2023-02-14.md'
Converted 'data\edgar_documents\NOW\4_2023-02-17' --> 'data\processed_data\NOW\4_2023-02-17.md'
Converted 'data\edgar_documents\NOW\4_2023-02-22' --> 'data\processed_data\NOW\4_2023-02-22.md'


2025-11-14 17:23:32,543 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,551 - INFO - Going to convert document batch...
2025-11-14 17:23:32,552 - INFO - Processing document 4_2023-03-23
2025-11-14 17:23:32,571 - INFO - Finished converting document 4_2023-03-23 in 0.03 sec.
2025-11-14 17:23:32,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,617 - INFO - Going to convert document batch...
2025-11-14 17:23:32,618 - INFO - Processing document 4_2023-04-10
2025-11-14 17:23:32,644 - INFO - Finished converting document 4_2023-04-10 in 0.05 sec.
2025-11-14 17:23:32,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,692 - INFO - Going to convert document batch...
2025-11-14 17:23:32,693 - INFO - Processing document 4_2023-04-18
2025-11-14 17:23:32,718 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2023-02-28' --> 'data\processed_data\NOW\4_2023-02-28.md'
Converted 'data\edgar_documents\NOW\4_2023-03-23' --> 'data\processed_data\NOW\4_2023-03-23.md'
Converted 'data\edgar_documents\NOW\4_2023-04-10' --> 'data\processed_data\NOW\4_2023-04-10.md'


2025-11-14 17:23:32,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,768 - INFO - Going to convert document batch...
2025-11-14 17:23:32,769 - INFO - Processing document 4_2023-05-02
2025-11-14 17:23:32,792 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 17:23:32,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,843 - INFO - Going to convert document batch...
2025-11-14 17:23:32,843 - INFO - Processing document 4_2023-05-08
2025-11-14 17:23:32,870 - INFO - Finished converting document 4_2023-05-08 in 0.06 sec.
2025-11-14 17:23:32,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:32,933 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NOW\4_2023-04-18' --> 'data\processed_data\NOW\4_2023-04-18.md'
Converted 'data\edgar_documents\NOW\4_2023-05-02' --> 'data\processed_data\NOW\4_2023-05-02.md'
Converted 'data\edgar_documents\NOW\4_2023-05-08' --> 'data\processed_data\NOW\4_2023-05-08.md'


2025-11-14 17:23:32,933 - INFO - Processing document 4_2023-05-09
2025-11-14 17:23:32,956 - INFO - Finished converting document 4_2023-05-09 in 0.05 sec.
2025-11-14 17:23:32,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,008 - INFO - Going to convert document batch...
2025-11-14 17:23:33,009 - INFO - Processing document 4_2023-05-10
2025-11-14 17:23:33,031 - INFO - Finished converting document 4_2023-05-10 in 0.05 sec.
2025-11-14 17:23:33,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,129 - INFO - Going to convert document batch...
2025-11-14 17:23:33,130 - INFO - Processing document 4_2023-05-12
2025-11-14 17:23:33,150 - INFO - Finished converting document 4_2023-05-12 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2023-05-09' --> 'data\processed_data\NOW\4_2023-05-09.md'
Converted 'data\edgar_documents\NOW\4_2023-05-10' --> 'data\processed_data\NOW\4_2023-05-10.md'


2025-11-14 17:23:33,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,197 - INFO - Going to convert document batch...
2025-11-14 17:23:33,198 - INFO - Processing document 4_2023-05-16
2025-11-14 17:23:33,220 - INFO - Finished converting document 4_2023-05-16 in 0.05 sec.
2025-11-14 17:23:33,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,287 - INFO - Going to convert document batch...
2025-11-14 17:23:33,287 - INFO - Processing document 4_2023-05-19
2025-11-14 17:23:33,315 - INFO - Finished converting document 4_2023-05-19 in 0.06 sec.
2025-11-14 17:23:33,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2023-05-12' --> 'data\processed_data\NOW\4_2023-05-12.md'
Converted 'data\edgar_documents\NOW\4_2023-05-16' --> 'data\processed_data\NOW\4_2023-05-16.md'
Converted 'data\edgar_documents\NOW\4_2023-05-19' --> 'data\processed_data\NOW\4_2023-05-19.md'


2025-11-14 17:23:33,386 - INFO - Going to convert document batch...
2025-11-14 17:23:33,387 - INFO - Processing document 4_2023-05-23
2025-11-14 17:23:33,406 - INFO - Finished converting document 4_2023-05-23 in 0.06 sec.
2025-11-14 17:23:33,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,452 - INFO - Going to convert document batch...
2025-11-14 17:23:33,453 - INFO - Processing document 4_2023-05-25
2025-11-14 17:23:33,472 - INFO - Finished converting document 4_2023-05-25 in 0.03 sec.
2025-11-14 17:23:33,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,519 - INFO - Going to convert document batch...
2025-11-14 17:23:33,519 - INFO - Processing document 4_2023-05-30
2025-11-14 17:23:33,538 - INFO - Finished converting document 4_2023-05-30 in 0.03 sec.
2025-11-14 17:23:33,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,581 - INFO - Going to convert document batch...
2025-11-14 17:23:33,581 - 

Converted 'data\edgar_documents\NOW\4_2023-05-23' --> 'data\processed_data\NOW\4_2023-05-23.md'
Converted 'data\edgar_documents\NOW\4_2023-05-25' --> 'data\processed_data\NOW\4_2023-05-25.md'
Converted 'data\edgar_documents\NOW\4_2023-05-30' --> 'data\processed_data\NOW\4_2023-05-30.md'


2025-11-14 17:23:33,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,647 - INFO - Going to convert document batch...
2025-11-14 17:23:33,647 - INFO - Processing document 4_2023-06-05
2025-11-14 17:23:33,672 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 17:23:33,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,723 - INFO - Going to convert document batch...
2025-11-14 17:23:33,725 - INFO - Processing document 4_2023-07-06
2025-11-14 17:23:33,749 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 17:23:33,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,796 - INFO - Going to convert document batch...
2025-11-14 17:23:33,796 - INFO - Processing document 4_2023-07-11


Converted 'data\edgar_documents\NOW\4_2023-06-01' --> 'data\processed_data\NOW\4_2023-06-01.md'
Converted 'data\edgar_documents\NOW\4_2023-06-05' --> 'data\processed_data\NOW\4_2023-06-05.md'
Converted 'data\edgar_documents\NOW\4_2023-07-06' --> 'data\processed_data\NOW\4_2023-07-06.md'


2025-11-14 17:23:33,819 - INFO - Finished converting document 4_2023-07-11 in 0.03 sec.
2025-11-14 17:23:33,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,870 - INFO - Going to convert document batch...
2025-11-14 17:23:33,871 - INFO - Processing document 4_2023-07-17
2025-11-14 17:23:33,894 - INFO - Finished converting document 4_2023-07-17 in 0.05 sec.
2025-11-14 17:23:33,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:33,936 - INFO - Going to convert document batch...
2025-11-14 17:23:33,936 - INFO - Processing document 4_2023-08-03
2025-11-14 17:23:33,959 - INFO - Finished converting document 4_2023-08-03 in 0.05 sec.
2025-11-14 17:23:33,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,001 - INFO - Going to convert document batch...
2025-11-14 17:23:34,002 - INFO - Processing document 4_2023-08-07
2025-11-14 17:23:34,022 - INFO - Finished converting document 4_2023-08-07 in 0.03 sec.


Converted 'data\edgar_documents\NOW\4_2023-07-11' --> 'data\processed_data\NOW\4_2023-07-11.md'
Converted 'data\edgar_documents\NOW\4_2023-07-17' --> 'data\processed_data\NOW\4_2023-07-17.md'
Converted 'data\edgar_documents\NOW\4_2023-08-03' --> 'data\processed_data\NOW\4_2023-08-03.md'
Converted 'data\edgar_documents\NOW\4_2023-08-07' --> 'data\processed_data\NOW\4_2023-08-07.md'


2025-11-14 17:23:34,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,058 - INFO - Going to convert document batch...
2025-11-14 17:23:34,059 - INFO - Processing document 4_2023-08-09
2025-11-14 17:23:34,077 - INFO - Finished converting document 4_2023-08-09 in 0.05 sec.
2025-11-14 17:23:34,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,138 - INFO - Going to convert document batch...
2025-11-14 17:23:34,139 - INFO - Processing document 4_2023-08-15
2025-11-14 17:23:34,177 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 17:23:34,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,222 - INFO - Going to convert document batch...
2025-11-14 17:23:34,223 - INFO - Processing document 4_2023-08-17
2025-11-14 17:23:34,246 - INFO - Finished converting document 4_2023-08-17 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2023-08-09' --> 'data\processed_data\NOW\4_2023-08-09.md'
Converted 'data\edgar_documents\NOW\4_2023-08-15' --> 'data\processed_data\NOW\4_2023-08-15.md'
Converted 'data\edgar_documents\NOW\4_2023-08-17' --> 'data\processed_data\NOW\4_2023-08-17.md'


2025-11-14 17:23:34,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,313 - INFO - Going to convert document batch...
2025-11-14 17:23:34,313 - INFO - Processing document 4_2023-08-21
2025-11-14 17:23:34,341 - INFO - Finished converting document 4_2023-08-21 in 0.08 sec.
2025-11-14 17:23:34,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,384 - INFO - Going to convert document batch...
2025-11-14 17:23:34,385 - INFO - Processing document 4_2023-08-23
2025-11-14 17:23:34,403 - INFO - Finished converting document 4_2023-08-23 in 0.05 sec.
2025-11-14 17:23:34,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,443 - INFO - Going to convert document batch...
2025-11-14 17:23:34,444 - INFO - Processing document 4_2023-08-31
2025-11-14 17:23:34,460 - INFO - Finished converting document 4_2023-08-31 in 0.03 sec.
2025-11-14 17:23:34,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\NOW\4_2023-08-21' --> 'data\processed_data\NOW\4_2023-08-21.md'
Converted 'data\edgar_documents\NOW\4_2023-08-23' --> 'data\processed_data\NOW\4_2023-08-23.md'
Converted 'data\edgar_documents\NOW\4_2023-08-31' --> 'data\processed_data\NOW\4_2023-08-31.md'


2025-11-14 17:23:34,558 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,567 - INFO - Going to convert document batch...
2025-11-14 17:23:34,568 - INFO - Processing document 4_2023-10-03
2025-11-14 17:23:34,590 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.
2025-11-14 17:23:34,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,661 - INFO - Going to convert document batch...
2025-11-14 17:23:34,662 - INFO - Processing document 4_2023-10-10
2025-11-14 17:23:34,696 - INFO - Finished converting document 4_2023-10-10 in 0.08 sec.
2025-11-14 17:23:34,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2023-09-05' --> 'data\processed_data\NOW\4_2023-09-05.md'
Converted 'data\edgar_documents\NOW\4_2023-10-03' --> 'data\processed_data\NOW\4_2023-10-03.md'
Converted 'data\edgar_documents\NOW\4_2023-10-10' --> 'data\processed_data\NOW\4_2023-10-10.md'


2025-11-14 17:23:34,741 - INFO - Going to convert document batch...
2025-11-14 17:23:34,742 - INFO - Processing document 4_2023-10-17
2025-11-14 17:23:34,765 - INFO - Finished converting document 4_2023-10-17 in 0.05 sec.
2025-11-14 17:23:34,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,812 - INFO - Going to convert document batch...
2025-11-14 17:23:34,812 - INFO - Processing document 4_2023-11-02
2025-11-14 17:23:34,833 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:23:34,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,873 - INFO - Going to convert document batch...
2025-11-14 17:23:34,874 - INFO - Processing document 4_2023-11-06
2025-11-14 17:23:34,893 - INFO - Finished converting document 4_2023-11-06 in 0.05 sec.
2025-11-14 17:23:34,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:34,932 - INFO - Going to convert document batch...
2025-11-14 17:23:34,933 - 

Converted 'data\edgar_documents\NOW\4_2023-10-17' --> 'data\processed_data\NOW\4_2023-10-17.md'
Converted 'data\edgar_documents\NOW\4_2023-11-02' --> 'data\processed_data\NOW\4_2023-11-02.md'
Converted 'data\edgar_documents\NOW\4_2023-11-06' --> 'data\processed_data\NOW\4_2023-11-06.md'
Converted 'data\edgar_documents\NOW\4_2023-11-09' --> 'data\processed_data\NOW\4_2023-11-09.md'


2025-11-14 17:23:35,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,014 - INFO - Going to convert document batch...
2025-11-14 17:23:35,015 - INFO - Processing document 4_2023-11-13
2025-11-14 17:23:35,032 - INFO - Finished converting document 4_2023-11-13 in 0.06 sec.
2025-11-14 17:23:35,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,092 - INFO - Going to convert document batch...
2025-11-14 17:23:35,093 - INFO - Processing document 4_2023-11-14
2025-11-14 17:23:35,123 - INFO - Finished converting document 4_2023-11-14 in 0.08 sec.
2025-11-14 17:23:35,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,166 - INFO - Going to convert document batch...
2025-11-14 17:23:35,167 - INFO - Processing document 4_2023-11-17
2025-11-14 17:23:35,189 - INFO - Finished converting document 4_2023-11-17 in 0.05 sec.
2025-11-14 17:23:35,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2023-11-13' --> 'data\processed_data\NOW\4_2023-11-13.md'
Converted 'data\edgar_documents\NOW\4_2023-11-14' --> 'data\processed_data\NOW\4_2023-11-14.md'
Converted 'data\edgar_documents\NOW\4_2023-11-17' --> 'data\processed_data\NOW\4_2023-11-17.md'


2025-11-14 17:23:35,240 - INFO - Going to convert document batch...
2025-11-14 17:23:35,241 - INFO - Processing document 4_2023-11-21
2025-11-14 17:23:35,270 - INFO - Finished converting document 4_2023-11-21 in 0.05 sec.
2025-11-14 17:23:35,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,317 - INFO - Going to convert document batch...
2025-11-14 17:23:35,318 - INFO - Processing document 4_2023-11-27
2025-11-14 17:23:35,335 - INFO - Finished converting document 4_2023-11-27 in 0.03 sec.
2025-11-14 17:23:35,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,392 - INFO - Going to convert document batch...
2025-11-14 17:23:35,393 - INFO - Processing document 4_2023-11-29
2025-11-14 17:23:35,410 - INFO - Finished converting document 4_2023-11-29 in 0.05 sec.
2025-11-14 17:23:35,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,450 - INFO - Going to convert document batch...
2025-11-14 17:23:35,451 - 

Converted 'data\edgar_documents\NOW\4_2023-11-21' --> 'data\processed_data\NOW\4_2023-11-21.md'
Converted 'data\edgar_documents\NOW\4_2023-11-27' --> 'data\processed_data\NOW\4_2023-11-27.md'
Converted 'data\edgar_documents\NOW\4_2023-11-29' --> 'data\processed_data\NOW\4_2023-11-29.md'


2025-11-14 17:23:35,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,515 - INFO - Going to convert document batch...
2025-11-14 17:23:35,516 - INFO - Processing document 4_2024-01-10
2025-11-14 17:23:35,539 - INFO - Finished converting document 4_2024-01-10 in 0.05 sec.
2025-11-14 17:23:35,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,594 - INFO - Going to convert document batch...
2025-11-14 17:23:35,596 - INFO - Processing document 4_2024-01-17
2025-11-14 17:23:35,623 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 17:23:35,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,671 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NOW\4_2023-12-01' --> 'data\processed_data\NOW\4_2023-12-01.md'
Converted 'data\edgar_documents\NOW\4_2024-01-10' --> 'data\processed_data\NOW\4_2024-01-10.md'
Converted 'data\edgar_documents\NOW\4_2024-01-17' --> 'data\processed_data\NOW\4_2024-01-17.md'


2025-11-14 17:23:35,671 - INFO - Processing document 4_2024-01-24
2025-11-14 17:23:35,691 - INFO - Finished converting document 4_2024-01-24 in 0.03 sec.
2025-11-14 17:23:35,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,739 - INFO - Going to convert document batch...
2025-11-14 17:23:35,740 - INFO - Processing document 4_2024-01-31
2025-11-14 17:23:35,759 - INFO - Finished converting document 4_2024-01-31 in 0.03 sec.
2025-11-14 17:23:35,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,796 - INFO - Going to convert document batch...
2025-11-14 17:23:35,797 - INFO - Processing document 4_2024-02-06
2025-11-14 17:23:35,818 - INFO - Finished converting document 4_2024-02-06 in 0.03 sec.
2025-11-14 17:23:35,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:35,857 - INFO - Going to convert document batch...
2025-11-14 17:23:35,858 - INFO - Processing document 4_2024-02-08
2025-11-14 17:23:35,877 - IN

Converted 'data\edgar_documents\NOW\4_2024-01-24' --> 'data\processed_data\NOW\4_2024-01-24.md'
Converted 'data\edgar_documents\NOW\4_2024-01-31' --> 'data\processed_data\NOW\4_2024-01-31.md'
Converted 'data\edgar_documents\NOW\4_2024-02-06' --> 'data\processed_data\NOW\4_2024-02-06.md'
Converted 'data\edgar_documents\NOW\4_2024-02-08' --> 'data\processed_data\NOW\4_2024-02-08.md'


2025-11-14 17:23:35,922 - INFO - Going to convert document batch...
2025-11-14 17:23:35,923 - INFO - Processing document 4_2024-02-09
2025-11-14 17:23:35,957 - INFO - Finished converting document 4_2024-02-09 in 0.06 sec.
2025-11-14 17:23:36,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,045 - INFO - Going to convert document batch...
2025-11-14 17:23:36,045 - INFO - Processing document 4_2024-02-14
2025-11-14 17:23:36,071 - INFO - Finished converting document 4_2024-02-14 in 0.06 sec.
2025-11-14 17:23:36,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,115 - INFO - Going to convert document batch...
2025-11-14 17:23:36,115 - INFO - Processing document 4_2024-02-20
2025-11-14 17:23:36,135 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 17:23:36,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,183 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NOW\4_2024-02-09' --> 'data\processed_data\NOW\4_2024-02-09.md'
Converted 'data\edgar_documents\NOW\4_2024-02-14' --> 'data\processed_data\NOW\4_2024-02-14.md'
Converted 'data\edgar_documents\NOW\4_2024-02-20' --> 'data\processed_data\NOW\4_2024-02-20.md'


2025-11-14 17:23:36,184 - INFO - Processing document 4_2024-02-21
2025-11-14 17:23:36,215 - INFO - Finished converting document 4_2024-02-21 in 0.06 sec.
2025-11-14 17:23:36,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,265 - INFO - Going to convert document batch...
2025-11-14 17:23:36,266 - INFO - Processing document 4_2024-02-28
2025-11-14 17:23:36,285 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 17:23:36,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,342 - INFO - Going to convert document batch...
2025-11-14 17:23:36,343 - INFO - Processing document 4_2024-04-17
2025-11-14 17:23:36,366 - INFO - Finished converting document 4_2024-04-17 in 0.05 sec.
2025-11-14 17:23:36,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,410 - INFO - Going to convert document batch...
2025-11-14 17:23:36,410 - INFO - Processing document 4_2024-05-09


Converted 'data\edgar_documents\NOW\4_2024-02-21' --> 'data\processed_data\NOW\4_2024-02-21.md'
Converted 'data\edgar_documents\NOW\4_2024-02-28' --> 'data\processed_data\NOW\4_2024-02-28.md'
Converted 'data\edgar_documents\NOW\4_2024-04-17' --> 'data\processed_data\NOW\4_2024-04-17.md'


2025-11-14 17:23:36,810 - INFO - Finished converting document 4_2024-05-09 in 0.42 sec.
2025-11-14 17:23:36,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,853 - INFO - Going to convert document batch...
2025-11-14 17:23:36,854 - INFO - Processing document 4_2024-05-14
2025-11-14 17:23:36,876 - INFO - Finished converting document 4_2024-05-14 in 0.05 sec.
2025-11-14 17:23:36,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,917 - INFO - Going to convert document batch...
2025-11-14 17:23:36,918 - INFO - Processing document 4_2024-05-17
2025-11-14 17:23:36,941 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 17:23:36,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:36,983 - INFO - Going to convert document batch...
2025-11-14 17:23:36,984 - INFO - Processing document 4_2024-05-21
2025-11-14 17:23:37,004 - INFO - Finished converting document 4_2024-05-21 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2024-05-09' --> 'data\processed_data\NOW\4_2024-05-09.md'
Converted 'data\edgar_documents\NOW\4_2024-05-14' --> 'data\processed_data\NOW\4_2024-05-14.md'
Converted 'data\edgar_documents\NOW\4_2024-05-17' --> 'data\processed_data\NOW\4_2024-05-17.md'
Converted 'data\edgar_documents\NOW\4_2024-05-21' --> 'data\processed_data\NOW\4_2024-05-21.md'


2025-11-14 17:23:37,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,058 - INFO - Going to convert document batch...
2025-11-14 17:23:37,059 - INFO - Processing document 4_2024-05-28
2025-11-14 17:23:37,078 - INFO - Finished converting document 4_2024-05-28 in 0.06 sec.
2025-11-14 17:23:37,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,154 - INFO - Going to convert document batch...
2025-11-14 17:23:37,154 - INFO - Processing document 4_2024-05-30
2025-11-14 17:23:37,171 - INFO - Finished converting document 4_2024-05-30 in 0.05 sec.
2025-11-14 17:23:37,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,227 - INFO - Going to convert document batch...
2025-11-14 17:23:37,228 - INFO - Processing document 4_2024-05-31
2025-11-14 17:23:37,258 - INFO - Finished converting document 4_2024-05-31 in 0.06 sec.
2025-11-14 17:23:37,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\NOW\4_2024-05-28' --> 'data\processed_data\NOW\4_2024-05-28.md'
Converted 'data\edgar_documents\NOW\4_2024-05-30' --> 'data\processed_data\NOW\4_2024-05-30.md'
Converted 'data\edgar_documents\NOW\4_2024-05-31' --> 'data\processed_data\NOW\4_2024-05-31.md'


2025-11-14 17:23:37,314 - INFO - Finished converting document 4_2024-06-05 in 0.05 sec.
2025-11-14 17:23:37,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,358 - INFO - Going to convert document batch...
2025-11-14 17:23:37,359 - INFO - Processing document 4_2024-06-07
2025-11-14 17:23:37,378 - INFO - Finished converting document 4_2024-06-07 in 0.05 sec.
2025-11-14 17:23:37,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,423 - INFO - Going to convert document batch...
2025-11-14 17:23:37,424 - INFO - Processing document 4_2024-07-01
2025-11-14 17:23:37,454 - INFO - Finished converting document 4_2024-07-01 in 0.06 sec.
2025-11-14 17:23:37,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2024-06-05' --> 'data\processed_data\NOW\4_2024-06-05.md'
Converted 'data\edgar_documents\NOW\4_2024-06-07' --> 'data\processed_data\NOW\4_2024-06-07.md'
Converted 'data\edgar_documents\NOW\4_2024-07-01' --> 'data\processed_data\NOW\4_2024-07-01.md'


2025-11-14 17:23:37,521 - INFO - Going to convert document batch...
2025-11-14 17:23:37,521 - INFO - Processing document 4_2024-07-17
2025-11-14 17:23:37,542 - INFO - Finished converting document 4_2024-07-17 in 0.06 sec.
2025-11-14 17:23:37,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,586 - INFO - Going to convert document batch...
2025-11-14 17:23:37,586 - INFO - Processing document 4_2024-07-29
2025-11-14 17:23:37,610 - INFO - Finished converting document 4_2024-07-29 in 0.05 sec.
2025-11-14 17:23:37,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,653 - INFO - Going to convert document batch...
2025-11-14 17:23:37,653 - INFO - Processing document 4_2024-07-31
2025-11-14 17:23:37,674 - INFO - Finished converting document 4_2024-07-31 in 0.05 sec.
2025-11-14 17:23:37,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,713 - INFO - Going to convert document batch...
2025-11-14 17:23:37,714 - 

Converted 'data\edgar_documents\NOW\4_2024-07-17' --> 'data\processed_data\NOW\4_2024-07-17.md'
Converted 'data\edgar_documents\NOW\4_2024-07-29' --> 'data\processed_data\NOW\4_2024-07-29.md'
Converted 'data\edgar_documents\NOW\4_2024-07-31' --> 'data\processed_data\NOW\4_2024-07-31.md'
Converted 'data\edgar_documents\NOW\4_2024-08-06' --> 'data\processed_data\NOW\4_2024-08-06.md'


2025-11-14 17:23:37,775 - INFO - Going to convert document batch...
2025-11-14 17:23:37,776 - INFO - Processing document 4_2024-08-09
2025-11-14 17:23:37,810 - INFO - Finished converting document 4_2024-08-09 in 0.06 sec.
2025-11-14 17:23:37,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,864 - INFO - Going to convert document batch...
2025-11-14 17:23:37,865 - INFO - Processing document 4_2024-08-13
2025-11-14 17:23:37,888 - INFO - Finished converting document 4_2024-08-13 in 0.05 sec.
2025-11-14 17:23:37,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:37,929 - INFO - Going to convert document batch...
2025-11-14 17:23:37,929 - INFO - Processing document 4_2024-08-14
2025-11-14 17:23:37,955 - INFO - Finished converting document 4_2024-08-14 in 0.05 sec.
2025-11-14 17:23:37,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,000 - INFO - Going to convert document batch...
2025-11-14 17:23:38,001 - 

Converted 'data\edgar_documents\NOW\4_2024-08-09' --> 'data\processed_data\NOW\4_2024-08-09.md'
Converted 'data\edgar_documents\NOW\4_2024-08-13' --> 'data\processed_data\NOW\4_2024-08-13.md'
Converted 'data\edgar_documents\NOW\4_2024-08-14' --> 'data\processed_data\NOW\4_2024-08-14.md'


2025-11-14 17:23:38,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,064 - INFO - Going to convert document batch...
2025-11-14 17:23:38,065 - INFO - Processing document 4_2024-08-20
2025-11-14 17:23:38,124 - INFO - Finished converting document 4_2024-08-20 in 0.09 sec.
2025-11-14 17:23:38,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,181 - INFO - Going to convert document batch...
2025-11-14 17:23:38,182 - INFO - Processing document 4_2024-08-22
2025-11-14 17:23:38,202 - INFO - Finished converting document 4_2024-08-22 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2024-08-16' --> 'data\processed_data\NOW\4_2024-08-16.md'
Converted 'data\edgar_documents\NOW\4_2024-08-20' --> 'data\processed_data\NOW\4_2024-08-20.md'


2025-11-14 17:23:38,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,242 - INFO - Going to convert document batch...
2025-11-14 17:23:38,242 - INFO - Processing document 4_2024-08-28
2025-11-14 17:23:38,259 - INFO - Finished converting document 4_2024-08-28 in 0.03 sec.
2025-11-14 17:23:38,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,318 - INFO - Going to convert document batch...
2025-11-14 17:23:38,318 - INFO - Processing document 4_2024-10-17
2025-11-14 17:23:38,342 - INFO - Finished converting document 4_2024-10-17 in 0.06 sec.
2025-11-14 17:23:38,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,385 - INFO - Going to convert document batch...
2025-11-14 17:23:38,386 - INFO - Processing document 4_2024-11-06
2025-11-14 17:23:38,404 - INFO - Finished converting document 4_2024-11-06 in 0.05 sec.


Converted 'data\edgar_documents\NOW\4_2024-08-22' --> 'data\processed_data\NOW\4_2024-08-22.md'
Converted 'data\edgar_documents\NOW\4_2024-08-28' --> 'data\processed_data\NOW\4_2024-08-28.md'
Converted 'data\edgar_documents\NOW\4_2024-10-17' --> 'data\processed_data\NOW\4_2024-10-17.md'


2025-11-14 17:23:38,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,458 - INFO - Going to convert document batch...
2025-11-14 17:23:38,459 - INFO - Processing document 4_2024-11-07
2025-11-14 17:23:38,499 - INFO - Finished converting document 4_2024-11-07 in 0.08 sec.
2025-11-14 17:23:38,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,563 - INFO - Going to convert document batch...
2025-11-14 17:23:38,564 - INFO - Processing document 4_2024-11-12
2025-11-14 17:23:38,593 - INFO - Finished converting document 4_2024-11-12 in 0.06 sec.
2025-11-14 17:23:38,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2024-11-06' --> 'data\processed_data\NOW\4_2024-11-06.md'
Converted 'data\edgar_documents\NOW\4_2024-11-07' --> 'data\processed_data\NOW\4_2024-11-07.md'
Converted 'data\edgar_documents\NOW\4_2024-11-12' --> 'data\processed_data\NOW\4_2024-11-12.md'


2025-11-14 17:23:38,641 - INFO - Going to convert document batch...
2025-11-14 17:23:38,641 - INFO - Processing document 4_2024-11-14
2025-11-14 17:23:38,668 - INFO - Finished converting document 4_2024-11-14 in 0.06 sec.
2025-11-14 17:23:38,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,711 - INFO - Going to convert document batch...
2025-11-14 17:23:38,712 - INFO - Processing document 4_2024-11-18
2025-11-14 17:23:38,731 - INFO - Finished converting document 4_2024-11-18 in 0.05 sec.
2025-11-14 17:23:38,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,773 - INFO - Going to convert document batch...
2025-11-14 17:23:38,774 - INFO - Processing document 4_2024-11-19
2025-11-14 17:23:38,798 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 17:23:38,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,860 - INFO - Going to convert document batch...
2025-11-14 17:23:38,861 - 

Converted 'data\edgar_documents\NOW\4_2024-11-14' --> 'data\processed_data\NOW\4_2024-11-14.md'
Converted 'data\edgar_documents\NOW\4_2024-11-18' --> 'data\processed_data\NOW\4_2024-11-18.md'
Converted 'data\edgar_documents\NOW\4_2024-11-19' --> 'data\processed_data\NOW\4_2024-11-19.md'


2025-11-14 17:23:38,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,925 - INFO - Going to convert document batch...
2025-11-14 17:23:38,925 - INFO - Processing document 4_2024-11-27
2025-11-14 17:23:38,943 - INFO - Finished converting document 4_2024-11-27 in 0.03 sec.
2025-11-14 17:23:38,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:38,995 - INFO - Going to convert document batch...
2025-11-14 17:23:38,997 - INFO - Processing document 4_2024-12-03
2025-11-14 17:23:39,037 - INFO - Finished converting document 4_2024-12-03 in 0.08 sec.
2025-11-14 17:23:39,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2024-11-21' --> 'data\processed_data\NOW\4_2024-11-21.md'
Converted 'data\edgar_documents\NOW\4_2024-11-27' --> 'data\processed_data\NOW\4_2024-11-27.md'
Converted 'data\edgar_documents\NOW\4_2024-12-03' --> 'data\processed_data\NOW\4_2024-12-03.md'


2025-11-14 17:23:39,109 - INFO - Going to convert document batch...
2025-11-14 17:23:39,110 - INFO - Processing document 4_2025-01-17
2025-11-14 17:23:39,133 - INFO - Finished converting document 4_2025-01-17 in 0.06 sec.
2025-11-14 17:23:39,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,182 - INFO - Going to convert document batch...
2025-11-14 17:23:39,182 - INFO - Processing document 4_2025-02-05
2025-11-14 17:23:39,210 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:23:39,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,264 - INFO - Going to convert document batch...
2025-11-14 17:23:39,264 - INFO - Processing document 4_2025-02-11
2025-11-14 17:23:39,283 - INFO - Finished converting document 4_2025-02-11 in 0.05 sec.
2025-11-14 17:23:39,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,323 - INFO - Going to convert document batch...
2025-11-14 17:23:39,324 - 

Converted 'data\edgar_documents\NOW\4_2025-01-17' --> 'data\processed_data\NOW\4_2025-01-17.md'
Converted 'data\edgar_documents\NOW\4_2025-02-05' --> 'data\processed_data\NOW\4_2025-02-05.md'
Converted 'data\edgar_documents\NOW\4_2025-02-11' --> 'data\processed_data\NOW\4_2025-02-11.md'


2025-11-14 17:23:39,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,398 - INFO - Going to convert document batch...
2025-11-14 17:23:39,399 - INFO - Processing document 4_2025-02-14
2025-11-14 17:23:39,450 - INFO - Finished converting document 4_2025-02-14 in 0.09 sec.
2025-11-14 17:23:39,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,528 - INFO - Going to convert document batch...
2025-11-14 17:23:39,528 - INFO - Processing document 4_2025-02-19
2025-11-14 17:23:39,558 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.


Converted 'data\edgar_documents\NOW\4_2025-02-12' --> 'data\processed_data\NOW\4_2025-02-12.md'
Converted 'data\edgar_documents\NOW\4_2025-02-14' --> 'data\processed_data\NOW\4_2025-02-14.md'


2025-11-14 17:23:39,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,608 - INFO - Going to convert document batch...
2025-11-14 17:23:39,609 - INFO - Processing document 4_2025-02-21
2025-11-14 17:23:39,642 - INFO - Finished converting document 4_2025-02-21 in 0.06 sec.
2025-11-14 17:23:39,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,694 - INFO - Going to convert document batch...
2025-11-14 17:23:39,695 - INFO - Processing document 4_2025-02-25
2025-11-14 17:23:39,712 - INFO - Finished converting document 4_2025-02-25 in 0.03 sec.
2025-11-14 17:23:39,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,750 - INFO - Going to convert document batch...
2025-11-14 17:23:39,751 - INFO - Processing document 4_2025-02-27


Converted 'data\edgar_documents\NOW\4_2025-02-19' --> 'data\processed_data\NOW\4_2025-02-19.md'
Converted 'data\edgar_documents\NOW\4_2025-02-21' --> 'data\processed_data\NOW\4_2025-02-21.md'
Converted 'data\edgar_documents\NOW\4_2025-02-25' --> 'data\processed_data\NOW\4_2025-02-25.md'


2025-11-14 17:23:39,770 - INFO - Finished converting document 4_2025-02-27 in 0.03 sec.
2025-11-14 17:23:39,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:39,810 - INFO - Going to convert document batch...
2025-11-14 17:23:39,811 - INFO - Processing document 4_2025-03-03
2025-11-14 17:23:39,829 - INFO - Finished converting document 4_2025-03-03 in 0.03 sec.
2025-11-14 17:23:39,864 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:23:39,865 - ERROR - Input document 4_2025-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\NOW\4_2025-02-27' --> 'data\processed_data\NOW\4_2025-02-27.md'
Converted 'data\edgar_documents\NOW\4_2025-03-03' --> 'data\processed_data\NOW\4_2025-03-03.md'
Error processing data\edgar_documents\NOW\4_2025-03-10: File format not allowed: data\edgar_documents\NOW\4_2025-03-10
Converted 'data\edgar_documents\NOW\4_2025-04-17' --> 'data\processed_data\NOW\4_2025-04-17.md'


2025-11-14 17:23:40,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,039 - INFO - Going to convert document batch...
2025-11-14 17:23:40,039 - INFO - Processing document 4_2025-05-09
2025-11-14 17:23:40,063 - INFO - Finished converting document 4_2025-05-09 in 0.05 sec.
2025-11-14 17:23:40,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,113 - INFO - Going to convert document batch...
2025-11-14 17:23:40,116 - INFO - Processing document 4_2025-05-14
2025-11-14 17:23:40,149 - INFO - Finished converting document 4_2025-05-14 in 0.06 sec.
2025-11-14 17:23:40,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,199 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NOW\4_2025-04-29' --> 'data\processed_data\NOW\4_2025-04-29.md'
Converted 'data\edgar_documents\NOW\4_2025-05-09' --> 'data\processed_data\NOW\4_2025-05-09.md'
Converted 'data\edgar_documents\NOW\4_2025-05-14' --> 'data\processed_data\NOW\4_2025-05-14.md'


2025-11-14 17:23:40,199 - INFO - Processing document 4_2025-05-19
2025-11-14 17:23:40,224 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 17:23:40,292 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:23:40,294 - ERROR - Input document 4_2025-05-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:23:40,297 - INFO - Going to convert document batch...
2025-11-14 17:23:40,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23

Converted 'data\edgar_documents\NOW\4_2025-05-19' --> 'data\processed_data\NOW\4_2025-05-19.md'
Error processing data\edgar_documents\NOW\4_2025-05-20: File format not allowed: data\edgar_documents\NOW\4_2025-05-20
Converted 'data\edgar_documents\NOW\4_2025-05-27' --> 'data\processed_data\NOW\4_2025-05-27.md'
Converted 'data\edgar_documents\NOW\4_2025-05-29' --> 'data\processed_data\NOW\4_2025-05-29.md'


2025-11-14 17:23:40,476 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:23:40,478 - ERROR - Input document 4_2025-05-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:23:40,480 - INFO - Going to convert document batch...
2025-11-14 17:23:40,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,508 - INFO - Going to convert document batch...
2025-11-14 17:23:40,509 - INFO - Processing document 4_2025-06-03
2025-11-14 17:23:40,547 - INFO - Fin

Error processing data\edgar_documents\NOW\4_2025-05-30: File format not allowed: data\edgar_documents\NOW\4_2025-05-30
Converted 'data\edgar_documents\NOW\4_2025-06-03' --> 'data\processed_data\NOW\4_2025-06-03.md'
Converted 'data\edgar_documents\NOW\4_2025-06-05' --> 'data\processed_data\NOW\4_2025-06-05.md'


2025-11-14 17:23:40,674 - INFO - Processing document 4_2025-07-08
2025-11-14 17:23:40,691 - INFO - Finished converting document 4_2025-07-08 in 0.05 sec.
2025-11-14 17:23:40,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,735 - INFO - Going to convert document batch...
2025-11-14 17:23:40,736 - INFO - Processing document 4_2025-07-17
2025-11-14 17:23:40,758 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 17:23:40,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,819 - INFO - Going to convert document batch...
2025-11-14 17:23:40,820 - INFO - Processing document 4_2025-07-28
2025-11-14 17:23:40,840 - INFO - Finished converting document 4_2025-07-28 in 0.06 sec.
2025-11-14 17:23:40,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:40,880 - INFO - Going to convert document batch...
2025-11-14 17:23:40,880 - INFO - Processing document 4_2025-07-31


Converted 'data\edgar_documents\NOW\4_2025-07-08' --> 'data\processed_data\NOW\4_2025-07-08.md'
Converted 'data\edgar_documents\NOW\4_2025-07-17' --> 'data\processed_data\NOW\4_2025-07-17.md'
Converted 'data\edgar_documents\NOW\4_2025-07-28' --> 'data\processed_data\NOW\4_2025-07-28.md'


2025-11-14 17:23:41,132 - INFO - Finished converting document 4_2025-07-31 in 0.27 sec.
2025-11-14 17:23:41,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,179 - INFO - Going to convert document batch...
2025-11-14 17:23:41,180 - INFO - Processing document 4_2025-08-11
2025-11-14 17:23:41,202 - INFO - Finished converting document 4_2025-08-11 in 0.05 sec.
2025-11-14 17:23:41,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,266 - INFO - Going to convert document batch...
2025-11-14 17:23:41,267 - INFO - Processing document 4_2025-08-14
2025-11-14 17:23:41,288 - INFO - Finished converting document 4_2025-08-14 in 0.06 sec.
2025-11-14 17:23:41,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\4_2025-07-31' --> 'data\processed_data\NOW\4_2025-07-31.md'
Converted 'data\edgar_documents\NOW\4_2025-08-11' --> 'data\processed_data\NOW\4_2025-08-11.md'
Converted 'data\edgar_documents\NOW\4_2025-08-14' --> 'data\processed_data\NOW\4_2025-08-14.md'


2025-11-14 17:23:41,331 - INFO - Going to convert document batch...
2025-11-14 17:23:41,331 - INFO - Processing document 4_2025-08-18
2025-11-14 17:23:41,348 - INFO - Finished converting document 4_2025-08-18 in 0.03 sec.
2025-11-14 17:23:41,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,417 - INFO - Going to convert document batch...
2025-11-14 17:23:41,418 - INFO - Processing document 4_2025-08-19
2025-11-14 17:23:41,457 - INFO - Finished converting document 4_2025-08-19 in 0.09 sec.
2025-11-14 17:23:41,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,504 - INFO - Going to convert document batch...
2025-11-14 17:23:41,505 - INFO - Processing document 4_2025-08-21
2025-11-14 17:23:41,523 - INFO - Finished converting document 4_2025-08-21 in 0.03 sec.


Converted 'data\edgar_documents\NOW\4_2025-08-18' --> 'data\processed_data\NOW\4_2025-08-18.md'
Converted 'data\edgar_documents\NOW\4_2025-08-19' --> 'data\processed_data\NOW\4_2025-08-19.md'
Converted 'data\edgar_documents\NOW\4_2025-08-21' --> 'data\processed_data\NOW\4_2025-08-21.md'


2025-11-14 17:23:41,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,584 - INFO - Going to convert document batch...
2025-11-14 17:23:41,585 - INFO - Processing document 4_2025-09-02
2025-11-14 17:23:41,613 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 17:23:41,676 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:23:41,677 - ERROR - Input document 4_2025-09-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:23

Converted 'data\edgar_documents\NOW\4_2025-09-02' --> 'data\processed_data\NOW\4_2025-09-02.md'
Error processing data\edgar_documents\NOW\4_2025-09-26: File format not allowed: data\edgar_documents\NOW\4_2025-09-26
Converted 'data\edgar_documents\NOW\8-K_2023-01-25' --> 'data\processed_data\NOW\8-K_2023-01-25.md'
Converted 'data\edgar_documents\NOW\8-K_2023-04-26' --> 'data\processed_data\NOW\8-K_2023-04-26.md'


2025-11-14 17:23:41,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,886 - INFO - Going to convert document batch...
2025-11-14 17:23:41,886 - INFO - Processing document 8-K_2023-06-02
2025-11-14 17:23:41,923 - INFO - Finished converting document 8-K_2023-06-02 in 0.06 sec.
2025-11-14 17:23:41,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:41,962 - INFO - Going to convert document batch...
2025-11-14 17:23:41,963 - INFO - Processing document 8-K_2023-07-26
2025-11-14 17:23:41,981 - INFO - Finished converting document 8-K_2023-07-26 in 0.05 sec.
2025-11-14 17:23:42,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,014 - INFO - Going to convert document batch...
2025-11-14 17:23:42,015 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:23:42,032 - INFO - Finished converting document 8-K_2023-10-25 in 0.05 sec.


Converted 'data\edgar_documents\NOW\8-K_2023-05-16' --> 'data\processed_data\NOW\8-K_2023-05-16.md'
Converted 'data\edgar_documents\NOW\8-K_2023-06-02' --> 'data\processed_data\NOW\8-K_2023-06-02.md'
Converted 'data\edgar_documents\NOW\8-K_2023-07-26' --> 'data\processed_data\NOW\8-K_2023-07-26.md'


2025-11-14 17:23:42,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,069 - INFO - Going to convert document batch...
2025-11-14 17:23:42,070 - INFO - Processing document 8-K_2024-01-24
2025-11-14 17:23:42,089 - INFO - Finished converting document 8-K_2024-01-24 in 0.05 sec.
2025-11-14 17:23:42,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,123 - INFO - Going to convert document batch...
2025-11-14 17:23:42,124 - INFO - Processing document 8-K_2024-04-24
2025-11-14 17:23:42,143 - INFO - Finished converting document 8-K_2024-04-24 in 0.05 sec.
2025-11-14 17:23:42,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,181 - INFO - Going to convert document batch...
2025-11-14 17:23:42,181 - INFO - Processing document 8-K_2024-05-23
2025-11-14 17:23:42,210 - INFO - Finished converting document 8-K_2024-05-23 in 0.05 sec.
2025-11-14 17:23:42,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\8-K_2023-10-25' --> 'data\processed_data\NOW\8-K_2023-10-25.md'
Converted 'data\edgar_documents\NOW\8-K_2024-01-24' --> 'data\processed_data\NOW\8-K_2024-01-24.md'
Converted 'data\edgar_documents\NOW\8-K_2024-04-24' --> 'data\processed_data\NOW\8-K_2024-04-24.md'
Converted 'data\edgar_documents\NOW\8-K_2024-05-23' --> 'data\processed_data\NOW\8-K_2024-05-23.md'


2025-11-14 17:23:42,245 - INFO - Going to convert document batch...
2025-11-14 17:23:42,247 - INFO - Processing document 8-K_2024-07-24
2025-11-14 17:23:42,269 - INFO - Finished converting document 8-K_2024-07-24 in 0.05 sec.
2025-11-14 17:23:42,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,307 - INFO - Going to convert document batch...
2025-11-14 17:23:42,308 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:23:42,330 - INFO - Finished converting document 8-K_2024-10-23 in 0.05 sec.
2025-11-14 17:23:42,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,368 - INFO - Going to convert document batch...
2025-11-14 17:23:42,369 - INFO - Processing document 8-K_2024-12-27
2025-11-14 17:23:42,390 - INFO - Finished converting document 8-K_2024-12-27 in 0.05 sec.
2025-11-14 17:23:42,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,422 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NOW\8-K_2024-07-24' --> 'data\processed_data\NOW\8-K_2024-07-24.md'
Converted 'data\edgar_documents\NOW\8-K_2024-10-23' --> 'data\processed_data\NOW\8-K_2024-10-23.md'
Converted 'data\edgar_documents\NOW\8-K_2024-12-27' --> 'data\processed_data\NOW\8-K_2024-12-27.md'
Converted 'data\edgar_documents\NOW\8-K_2025-01-29' --> 'data\processed_data\NOW\8-K_2025-01-29.md'


2025-11-14 17:23:42,474 - INFO - Going to convert document batch...
2025-11-14 17:23:42,474 - INFO - Processing document 8-K_2025-02-12
2025-11-14 17:23:42,492 - INFO - Finished converting document 8-K_2025-02-12 in 0.03 sec.
2025-11-14 17:23:42,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,548 - INFO - Going to convert document batch...
2025-11-14 17:23:42,550 - INFO - Processing document 8-K_2025-03-10
2025-11-14 17:23:42,578 - INFO - Finished converting document 8-K_2025-03-10 in 0.08 sec.
2025-11-14 17:23:42,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,613 - INFO - Going to convert document batch...
2025-11-14 17:23:42,613 - INFO - Processing document 8-K_2025-04-23
2025-11-14 17:23:42,633 - INFO - Finished converting document 8-K_2025-04-23 in 0.03 sec.
2025-11-14 17:23:42,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\8-K_2025-02-12' --> 'data\processed_data\NOW\8-K_2025-02-12.md'
Converted 'data\edgar_documents\NOW\8-K_2025-03-10' --> 'data\processed_data\NOW\8-K_2025-03-10.md'
Converted 'data\edgar_documents\NOW\8-K_2025-04-23' --> 'data\processed_data\NOW\8-K_2025-04-23.md'


2025-11-14 17:23:42,703 - INFO - Going to convert document batch...
2025-11-14 17:23:42,704 - INFO - Processing document 8-K_2025-05-27
2025-11-14 17:23:42,736 - INFO - Finished converting document 8-K_2025-05-27 in 0.09 sec.
2025-11-14 17:23:42,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,778 - INFO - Going to convert document batch...
2025-11-14 17:23:42,779 - INFO - Processing document 8-K_2025-05-30
2025-11-14 17:23:42,799 - INFO - Finished converting document 8-K_2025-05-30 in 0.05 sec.
2025-11-14 17:23:42,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,830 - INFO - Going to convert document batch...
2025-11-14 17:23:42,831 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:23:42,848 - INFO - Finished converting document 8-K_2025-07-23 in 0.03 sec.
2025-11-14 17:23:42,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:23:42,883 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NOW\8-K_2025-05-27' --> 'data\processed_data\NOW\8-K_2025-05-27.md'
Converted 'data\edgar_documents\NOW\8-K_2025-05-30' --> 'data\processed_data\NOW\8-K_2025-05-30.md'
Converted 'data\edgar_documents\NOW\8-K_2025-07-23' --> 'data\processed_data\NOW\8-K_2025-07-23.md'
Converted 'data\edgar_documents\NOW\8-K_2025-09-26' --> 'data\processed_data\NOW\8-K_2025-09-26.md'


2025-11-14 17:23:42,936 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:23:42,955 - INFO - Finished converting document 8-K_2025-10-29 in 0.05 sec.
2025-11-14 17:23:42,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\8-K_2025-10-29' --> 'data\processed_data\NOW\8-K_2025-10-29.md'


2025-11-14 17:23:43,399 - INFO - Going to convert document batch...
2025-11-14 17:23:43,400 - INFO - Processing document DEF-14A_2023-04-13
2025-11-14 17:23:45,375 - INFO - Finished converting document DEF-14A_2023-04-13 in 2.41 sec.
2025-11-14 17:23:45,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\DEF-14A_2023-04-13' --> 'data\processed_data\NOW\DEF-14A_2023-04-13.md'


2025-11-14 17:23:46,435 - INFO - Going to convert document batch...
2025-11-14 17:23:46,436 - INFO - Processing document DEF-14A_2024-04-04
2025-11-14 17:23:49,912 - INFO - Finished converting document DEF-14A_2024-04-04 in 3.98 sec.
2025-11-14 17:23:51,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\DEF-14A_2024-04-04' --> 'data\processed_data\NOW\DEF-14A_2024-04-04.md'


2025-11-14 17:23:51,681 - INFO - Going to convert document batch...
2025-11-14 17:23:51,682 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 17:23:56,052 - INFO - Finished converting document DEF-14A_2025-04-04 in 5.00 sec.
2025-11-14 17:23:57,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NOW\DEF-14A_2025-04-04' --> 'data\processed_data\NOW\DEF-14A_2025-04-04.md'
Processed 158 new files. Errors: 4
Found 187 files to process in data\edgar_documents\NVDA


2025-11-14 17:23:57,854 - INFO - Going to convert document batch...
2025-11-14 17:23:57,855 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:23:57,856 - INFO - Processing document 10-K_2023-02-24
2025-11-14 17:23:58,944 - INFO - Finished converting document 10-K_2023-02-24 in 1.58 sec.
2025-11-14 17:23:59,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-K_2023-02-24' --> 'data\processed_data\NVDA\10-K_2023-02-24.md'


2025-11-14 17:24:00,341 - INFO - Going to convert document batch...
2025-11-14 17:24:00,342 - INFO - Processing document 10-K_2024-02-21
2025-11-14 17:24:01,246 - INFO - Finished converting document 10-K_2024-02-21 in 1.77 sec.
2025-11-14 17:24:01,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-K_2024-02-21' --> 'data\processed_data\NVDA\10-K_2024-02-21.md'


2025-11-14 17:24:02,185 - INFO - Going to convert document batch...
2025-11-14 17:24:02,186 - INFO - Processing document 10-K_2025-02-26
2025-11-14 17:24:03,047 - INFO - Finished converting document 10-K_2025-02-26 in 1.33 sec.
2025-11-14 17:24:03,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-K_2025-02-26' --> 'data\processed_data\NVDA\10-K_2025-02-26.md'


2025-11-14 17:24:04,093 - INFO - Going to convert document batch...
2025-11-14 17:24:04,094 - INFO - Processing document 10-Q_2023-05-26
2025-11-14 17:24:04,671 - INFO - Finished converting document 10-Q_2023-05-26 in 0.88 sec.
2025-11-14 17:24:04,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2023-05-26' --> 'data\processed_data\NVDA\10-Q_2023-05-26.md'


2025-11-14 17:24:05,293 - INFO - Going to convert document batch...
2025-11-14 17:24:05,293 - INFO - Processing document 10-Q_2023-08-28
2025-11-14 17:24:05,939 - INFO - Finished converting document 10-Q_2023-08-28 in 1.00 sec.
2025-11-14 17:24:06,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2023-08-28' --> 'data\processed_data\NVDA\10-Q_2023-08-28.md'


2025-11-14 17:24:06,889 - INFO - Going to convert document batch...
2025-11-14 17:24:06,890 - INFO - Processing document 10-Q_2023-11-21
2025-11-14 17:24:07,562 - INFO - Finished converting document 10-Q_2023-11-21 in 1.31 sec.
2025-11-14 17:24:07,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2023-11-21' --> 'data\processed_data\NVDA\10-Q_2023-11-21.md'


2025-11-14 17:24:08,181 - INFO - Going to convert document batch...
2025-11-14 17:24:08,182 - INFO - Processing document 10-Q_2024-05-29
2025-11-14 17:24:08,782 - INFO - Finished converting document 10-Q_2024-05-29 in 0.91 sec.
2025-11-14 17:24:09,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2024-05-29' --> 'data\processed_data\NVDA\10-Q_2024-05-29.md'


2025-11-14 17:24:09,677 - INFO - Going to convert document batch...
2025-11-14 17:24:09,677 - INFO - Processing document 10-Q_2024-08-28
2025-11-14 17:24:10,288 - INFO - Finished converting document 10-Q_2024-08-28 in 1.23 sec.
2025-11-14 17:24:10,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2024-08-28' --> 'data\processed_data\NVDA\10-Q_2024-08-28.md'


2025-11-14 17:24:10,937 - INFO - Going to convert document batch...
2025-11-14 17:24:10,938 - INFO - Processing document 10-Q_2024-11-20
2025-11-14 17:24:11,570 - INFO - Finished converting document 10-Q_2024-11-20 in 0.98 sec.
2025-11-14 17:24:11,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2024-11-20' --> 'data\processed_data\NVDA\10-Q_2024-11-20.md'


2025-11-14 17:24:12,430 - INFO - Going to convert document batch...
2025-11-14 17:24:12,431 - INFO - Processing document 10-Q_2025-05-28
2025-11-14 17:24:12,921 - INFO - Finished converting document 10-Q_2025-05-28 in 1.06 sec.
2025-11-14 17:24:13,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\10-Q_2025-05-28' --> 'data\processed_data\NVDA\10-Q_2025-05-28.md'


2025-11-14 17:24:13,517 - INFO - Going to convert document batch...
2025-11-14 17:24:13,518 - INFO - Processing document 10-Q_2025-08-27
2025-11-14 17:24:14,131 - INFO - Finished converting document 10-Q_2025-08-27 in 0.97 sec.
2025-11-14 17:24:14,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,429 - INFO - Going to convert document batch...
2025-11-14 17:24:14,430 - INFO - Processing document 4_2023-01-11
2025-11-14 17:24:14,456 - INFO - Finished converting document 4_2023-01-11 in 0.05 sec.
2025-11-14 17:24:14,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,530 - INFO - Going to convert document batch...
2025-11-14 17:24:14,531 - INFO - Processing document 4_2023-01-17
2025-11-14 17:24:14,553 - INFO - Finished converting document 4_2023-01-17 in 0.06 sec.
2025-11-14 17:24:14,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,592 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\10-Q_2025-08-27' --> 'data\processed_data\NVDA\10-Q_2025-08-27.md'
Converted 'data\edgar_documents\NVDA\4_2023-01-11' --> 'data\processed_data\NVDA\4_2023-01-11.md'
Converted 'data\edgar_documents\NVDA\4_2023-01-17' --> 'data\processed_data\NVDA\4_2023-01-17.md'


2025-11-14 17:24:14,593 - INFO - Processing document 4_2023-01-27
2025-11-14 17:24:14,611 - INFO - Finished converting document 4_2023-01-27 in 0.03 sec.
2025-11-14 17:24:14,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,652 - INFO - Going to convert document batch...
2025-11-14 17:24:14,653 - INFO - Processing document 4_2023-02-28
2025-11-14 17:24:14,670 - INFO - Finished converting document 4_2023-02-28 in 0.05 sec.
2025-11-14 17:24:14,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,708 - INFO - Going to convert document batch...
2025-11-14 17:24:14,709 - INFO - Processing document 4_2023-03-06
2025-11-14 17:24:14,730 - INFO - Finished converting document 4_2023-03-06 in 0.05 sec.
2025-11-14 17:24:14,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,771 - INFO - Going to convert document batch...
2025-11-14 17:24:14,772 - INFO - Processing document 4_2023-03-09
2025-11-14 17:24:14,791 - IN

Converted 'data\edgar_documents\NVDA\4_2023-01-27' --> 'data\processed_data\NVDA\4_2023-01-27.md'
Converted 'data\edgar_documents\NVDA\4_2023-02-28' --> 'data\processed_data\NVDA\4_2023-02-28.md'
Converted 'data\edgar_documents\NVDA\4_2023-03-06' --> 'data\processed_data\NVDA\4_2023-03-06.md'
Converted 'data\edgar_documents\NVDA\4_2023-03-09' --> 'data\processed_data\NVDA\4_2023-03-09.md'


2025-11-14 17:24:14,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:14,856 - INFO - Going to convert document batch...
2025-11-14 17:24:14,857 - INFO - Processing document 4_2023-03-14
2025-11-14 17:24:15,213 - INFO - Finished converting document 4_2023-03-14 in 0.41 sec.
2025-11-14 17:24:15,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,263 - INFO - Going to convert document batch...
2025-11-14 17:24:15,264 - INFO - Processing document 4_2023-03-15
2025-11-14 17:24:15,282 - INFO - Finished converting document 4_2023-03-15 in 0.05 sec.
2025-11-14 17:24:15,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,327 - INFO - Going to convert document batch...
2025-11-14 17:24:15,328 - INFO - Processing document 4_2023-03-17
2025-11-14 17:24:15,346 - INFO - Finished converting document 4_2023-03-17 in 0.05 sec.
2025-11-14 17:24:15,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\NVDA\4_2023-03-14' --> 'data\processed_data\NVDA\4_2023-03-14.md'
Converted 'data\edgar_documents\NVDA\4_2023-03-15' --> 'data\processed_data\NVDA\4_2023-03-15.md'
Converted 'data\edgar_documents\NVDA\4_2023-03-17' --> 'data\processed_data\NVDA\4_2023-03-17.md'
Converted 'data\edgar_documents\NVDA\4_2023-03-31' --> 'data\processed_data\NVDA\4_2023-03-31.md'


2025-11-14 17:24:15,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,449 - INFO - Going to convert document batch...
2025-11-14 17:24:15,450 - INFO - Processing document 4_2023-05-22
2025-11-14 17:24:15,471 - INFO - Finished converting document 4_2023-05-22 in 0.05 sec.
2025-11-14 17:24:15,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,516 - INFO - Going to convert document batch...
2025-11-14 17:24:15,517 - INFO - Processing document 4_2023-05-31
2025-11-14 17:24:15,538 - INFO - Finished converting document 4_2023-05-31 in 0.03 sec.
2025-11-14 17:24:15,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,612 - INFO - Going to convert document batch...
2025-11-14 17:24:15,613 - INFO - Processing document 4_2023-06-01
2025-11-14 17:24:15,653 - INFO - Finished converting document 4_2023-06-01 in 0.09 sec.


Converted 'data\edgar_documents\NVDA\4_2023-05-22' --> 'data\processed_data\NVDA\4_2023-05-22.md'
Converted 'data\edgar_documents\NVDA\4_2023-05-31' --> 'data\processed_data\NVDA\4_2023-05-31.md'


2025-11-14 17:24:15,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,711 - INFO - Going to convert document batch...
2025-11-14 17:24:15,712 - INFO - Processing document 4_2023-06-05
2025-11-14 17:24:15,730 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 17:24:15,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,802 - INFO - Going to convert document batch...
2025-11-14 17:24:15,804 - INFO - Processing document 4_2023-06-06
2025-11-14 17:24:15,829 - INFO - Finished converting document 4_2023-06-06 in 0.06 sec.
2025-11-14 17:24:15,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2023-06-01' --> 'data\processed_data\NVDA\4_2023-06-01.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-05' --> 'data\processed_data\NVDA\4_2023-06-05.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-06' --> 'data\processed_data\NVDA\4_2023-06-06.md'


2025-11-14 17:24:15,902 - INFO - Going to convert document batch...
2025-11-14 17:24:15,903 - INFO - Processing document 4_2023-06-09
2025-11-14 17:24:15,927 - INFO - Finished converting document 4_2023-06-09 in 0.06 sec.
2025-11-14 17:24:15,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:15,982 - INFO - Going to convert document batch...
2025-11-14 17:24:15,983 - INFO - Processing document 4_2023-06-12
2025-11-14 17:24:16,004 - INFO - Finished converting document 4_2023-06-12 in 0.05 sec.
2025-11-14 17:24:16,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,053 - INFO - Going to convert document batch...
2025-11-14 17:24:16,054 - INFO - Processing document 4_2023-06-14
2025-11-14 17:24:16,087 - INFO - Finished converting document 4_2023-06-14 in 0.05 sec.
2025-11-14 17:24:16,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,139 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2023-06-09' --> 'data\processed_data\NVDA\4_2023-06-09.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-12' --> 'data\processed_data\NVDA\4_2023-06-12.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-14' --> 'data\processed_data\NVDA\4_2023-06-14.md'


2025-11-14 17:24:16,140 - INFO - Processing document 4_2023-06-15
2025-11-14 17:24:16,159 - INFO - Finished converting document 4_2023-06-15 in 0.03 sec.
2025-11-14 17:24:16,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,219 - INFO - Going to convert document batch...
2025-11-14 17:24:16,221 - INFO - Processing document 4_2023-06-16
2025-11-14 17:24:16,248 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.
2025-11-14 17:24:16,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,297 - INFO - Going to convert document batch...
2025-11-14 17:24:16,297 - INFO - Processing document 4_2023-06-21
2025-11-14 17:24:16,323 - INFO - Finished converting document 4_2023-06-21 in 0.05 sec.
2025-11-14 17:24:16,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,372 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2023-06-15' --> 'data\processed_data\NVDA\4_2023-06-15.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-16' --> 'data\processed_data\NVDA\4_2023-06-16.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-21' --> 'data\processed_data\NVDA\4_2023-06-21.md'


2025-11-14 17:24:16,373 - INFO - Processing document 4_2023-06-23
2025-11-14 17:24:16,393 - INFO - Finished converting document 4_2023-06-23 in 0.05 sec.
2025-11-14 17:24:16,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,443 - INFO - Going to convert document batch...
2025-11-14 17:24:16,444 - INFO - Processing document 4_2023-06-27
2025-11-14 17:24:16,464 - INFO - Finished converting document 4_2023-06-27 in 0.05 sec.
2025-11-14 17:24:16,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,509 - INFO - Going to convert document batch...
2025-11-14 17:24:16,510 - INFO - Processing document 4_2023-08-09
2025-11-14 17:24:16,527 - INFO - Finished converting document 4_2023-08-09 in 0.05 sec.
2025-11-14 17:24:16,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,571 - INFO - Going to convert document batch...
2025-11-14 17:24:16,572 - INFO - Processing document 4_2023-08-30
2025-11-14 17:24:16,594 - IN

Converted 'data\edgar_documents\NVDA\4_2023-06-23' --> 'data\processed_data\NVDA\4_2023-06-23.md'
Converted 'data\edgar_documents\NVDA\4_2023-06-27' --> 'data\processed_data\NVDA\4_2023-06-27.md'
Converted 'data\edgar_documents\NVDA\4_2023-08-09' --> 'data\processed_data\NVDA\4_2023-08-09.md'


2025-11-14 17:24:16,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,654 - INFO - Going to convert document batch...
2025-11-14 17:24:16,654 - INFO - Processing document 4_2023-09-06
2025-11-14 17:24:16,707 - INFO - Finished converting document 4_2023-09-06 in 0.09 sec.
2025-11-14 17:24:16,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,804 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2023-08-30' --> 'data\processed_data\NVDA\4_2023-08-30.md'
Converted 'data\edgar_documents\NVDA\4_2023-09-06' --> 'data\processed_data\NVDA\4_2023-09-06.md'


2025-11-14 17:24:16,806 - INFO - Processing document 4_2023-09-11
2025-11-14 17:24:16,857 - INFO - Finished converting document 4_2023-09-11 in 0.09 sec.
2025-11-14 17:24:16,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:16,936 - INFO - Going to convert document batch...
2025-11-14 17:24:16,937 - INFO - Processing document 4_2023-09-13
2025-11-14 17:24:16,983 - INFO - Finished converting document 4_2023-09-13 in 0.08 sec.
2025-11-14 17:24:17,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,070 - INFO - Going to convert document batch...
2025-11-14 17:24:17,071 - INFO - Processing document 4_2023-09-18
2025-11-14 17:24:17,112 - INFO - Finished converting document 4_2023-09-18 in 0.09 sec.


Converted 'data\edgar_documents\NVDA\4_2023-09-11' --> 'data\processed_data\NVDA\4_2023-09-11.md'
Converted 'data\edgar_documents\NVDA\4_2023-09-13' --> 'data\processed_data\NVDA\4_2023-09-13.md'


2025-11-14 17:24:17,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,184 - INFO - Going to convert document batch...
2025-11-14 17:24:17,186 - INFO - Processing document 4_2023-09-22
2025-11-14 17:24:17,223 - INFO - Finished converting document 4_2023-09-22 in 0.08 sec.
2025-11-14 17:24:17,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,276 - INFO - Going to convert document batch...
2025-11-14 17:24:17,277 - INFO - Processing document 4_2023-10-10
2025-11-14 17:24:17,302 - INFO - Finished converting document 4_2023-10-10 in 0.05 sec.


Converted 'data\edgar_documents\NVDA\4_2023-09-18' --> 'data\processed_data\NVDA\4_2023-09-18.md'
Converted 'data\edgar_documents\NVDA\4_2023-09-22' --> 'data\processed_data\NVDA\4_2023-09-22.md'


2025-11-14 17:24:17,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,352 - INFO - Going to convert document batch...
2025-11-14 17:24:17,353 - INFO - Processing document 4_2023-11-28
2025-11-14 17:24:17,371 - INFO - Finished converting document 4_2023-11-28 in 0.05 sec.
2025-11-14 17:24:17,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,413 - INFO - Going to convert document batch...
2025-11-14 17:24:17,414 - INFO - Processing document 4_2023-11-30
2025-11-14 17:24:17,433 - INFO - Finished converting document 4_2023-11-30 in 0.05 sec.
2025-11-14 17:24:17,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,478 - INFO - Going to convert document batch...
2025-11-14 17:24:17,479 - INFO - Processing document 4_2023-12-01


Converted 'data\edgar_documents\NVDA\4_2023-10-10' --> 'data\processed_data\NVDA\4_2023-10-10.md'
Converted 'data\edgar_documents\NVDA\4_2023-11-28' --> 'data\processed_data\NVDA\4_2023-11-28.md'
Converted 'data\edgar_documents\NVDA\4_2023-11-30' --> 'data\processed_data\NVDA\4_2023-11-30.md'


2025-11-14 17:24:17,516 - INFO - Finished converting document 4_2023-12-01 in 0.06 sec.
2025-11-14 17:24:17,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,592 - INFO - Going to convert document batch...
2025-11-14 17:24:17,593 - INFO - Processing document 4_2023-12-15
2025-11-14 17:24:17,621 - INFO - Finished converting document 4_2023-12-15 in 0.08 sec.
2025-11-14 17:24:17,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,665 - INFO - Going to convert document batch...
2025-11-14 17:24:17,666 - INFO - Processing document 4_2023-12-19
2025-11-14 17:24:17,686 - INFO - Finished converting document 4_2023-12-19 in 0.05 sec.
2025-11-14 17:24:17,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,724 - INFO - Going to convert document batch...
2025-11-14 17:24:17,725 - INFO - Processing document 4_2023-12-20
2025-11-14 17:24:17,743 - INFO - Finished converting document 4_2023-12-20 in 0.03 sec.


Converted 'data\edgar_documents\NVDA\4_2023-12-01' --> 'data\processed_data\NVDA\4_2023-12-01.md'
Converted 'data\edgar_documents\NVDA\4_2023-12-15' --> 'data\processed_data\NVDA\4_2023-12-15.md'
Converted 'data\edgar_documents\NVDA\4_2023-12-19' --> 'data\processed_data\NVDA\4_2023-12-19.md'


2025-11-14 17:24:17,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,784 - INFO - Going to convert document batch...
2025-11-14 17:24:17,785 - INFO - Processing document 4_2024-01-09
2025-11-14 17:24:17,807 - INFO - Finished converting document 4_2024-01-09 in 0.05 sec.
2025-11-14 17:24:17,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,857 - INFO - Going to convert document batch...
2025-11-14 17:24:17,858 - INFO - Processing document 4_2024-01-12
2025-11-14 17:24:17,886 - INFO - Finished converting document 4_2024-01-12 in 0.06 sec.
2025-11-14 17:24:17,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:17,952 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2023-12-20' --> 'data\processed_data\NVDA\4_2023-12-20.md'
Converted 'data\edgar_documents\NVDA\4_2024-01-09' --> 'data\processed_data\NVDA\4_2024-01-09.md'
Converted 'data\edgar_documents\NVDA\4_2024-01-12' --> 'data\processed_data\NVDA\4_2024-01-12.md'


2025-11-14 17:24:17,953 - INFO - Processing document 4_2024-01-16
2025-11-14 17:24:17,973 - INFO - Finished converting document 4_2024-01-16 in 0.06 sec.
2025-11-14 17:24:18,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,018 - INFO - Going to convert document batch...
2025-11-14 17:24:18,019 - INFO - Processing document 4_2024-02-27
2025-11-14 17:24:18,042 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 17:24:18,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,101 - INFO - Going to convert document batch...
2025-11-14 17:24:18,102 - INFO - Processing document 4_2024-03-06
2025-11-14 17:24:18,130 - INFO - Finished converting document 4_2024-03-06 in 0.06 sec.
2025-11-14 17:24:18,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,172 - INFO - Going to convert document batch...
2025-11-14 17:24:18,172 - INFO - Processing document 4_2024-03-08
2025-11-14 17:24:18,194 - IN

Converted 'data\edgar_documents\NVDA\4_2024-01-16' --> 'data\processed_data\NVDA\4_2024-01-16.md'
Converted 'data\edgar_documents\NVDA\4_2024-02-27' --> 'data\processed_data\NVDA\4_2024-02-27.md'
Converted 'data\edgar_documents\NVDA\4_2024-03-06' --> 'data\processed_data\NVDA\4_2024-03-06.md'


2025-11-14 17:24:18,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,240 - INFO - Going to convert document batch...
2025-11-14 17:24:18,241 - INFO - Processing document 4_2024-03-11
2025-11-14 17:24:18,263 - INFO - Finished converting document 4_2024-03-11 in 0.05 sec.
2025-11-14 17:24:18,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,322 - INFO - Going to convert document batch...
2025-11-14 17:24:18,323 - INFO - Processing document 4_2024-03-12
2025-11-14 17:24:18,343 - INFO - Finished converting document 4_2024-03-12 in 0.06 sec.
2025-11-14 17:24:18,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,397 - INFO - Going to convert document batch...
2025-11-14 17:24:18,398 - INFO - Processing document 4_2024-03-22
2025-11-14 17:24:18,415 - INFO - Finished converting document 4_2024-03-22 in 0.05 sec.


Converted 'data\edgar_documents\NVDA\4_2024-03-08' --> 'data\processed_data\NVDA\4_2024-03-08.md'
Converted 'data\edgar_documents\NVDA\4_2024-03-11' --> 'data\processed_data\NVDA\4_2024-03-11.md'
Converted 'data\edgar_documents\NVDA\4_2024-03-12' --> 'data\processed_data\NVDA\4_2024-03-12.md'


2025-11-14 17:24:18,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,454 - INFO - Going to convert document batch...
2025-11-14 17:24:18,455 - INFO - Processing document 4_2024-03-26
2025-11-14 17:24:18,476 - INFO - Finished converting document 4_2024-03-26 in 0.03 sec.
2025-11-14 17:24:18,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,518 - INFO - Going to convert document batch...
2025-11-14 17:24:18,519 - INFO - Processing document 4_2024-03-27
2025-11-14 17:24:18,539 - INFO - Finished converting document 4_2024-03-27 in 0.03 sec.
2025-11-14 17:24:18,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,600 - INFO - Going to convert document batch...
2025-11-14 17:24:18,601 - INFO - Processing document 4_2024-04-01
2025-11-14 17:24:18,621 - INFO - Finished converting document 4_2024-04-01 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2024-03-22' --> 'data\processed_data\NVDA\4_2024-03-22.md'
Converted 'data\edgar_documents\NVDA\4_2024-03-26' --> 'data\processed_data\NVDA\4_2024-03-26.md'
Converted 'data\edgar_documents\NVDA\4_2024-03-27' --> 'data\processed_data\NVDA\4_2024-03-27.md'


2025-11-14 17:24:18,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,664 - INFO - Going to convert document batch...
2025-11-14 17:24:18,666 - INFO - Processing document 4_2024-04-03


Converted 'data\edgar_documents\NVDA\4_2024-04-01' --> 'data\processed_data\NVDA\4_2024-04-01.md'


2025-11-14 17:24:18,935 - INFO - Finished converting document 4_2024-04-03 in 0.30 sec.
2025-11-14 17:24:18,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:18,984 - INFO - Going to convert document batch...
2025-11-14 17:24:18,985 - INFO - Processing document 4_2024-04-09
2025-11-14 17:24:19,013 - INFO - Finished converting document 4_2024-04-09 in 0.06 sec.
2025-11-14 17:24:19,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,058 - INFO - Going to convert document batch...
2025-11-14 17:24:19,059 - INFO - Processing document 4_2024-04-10
2025-11-14 17:24:19,086 - INFO - Finished converting document 4_2024-04-10 in 0.05 sec.
2025-11-14 17:24:19,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,127 - INFO - Going to convert document batch...
2025-11-14 17:24:19,128 - INFO - Processing document 4_2024-05-29


Converted 'data\edgar_documents\NVDA\4_2024-04-03' --> 'data\processed_data\NVDA\4_2024-04-03.md'
Converted 'data\edgar_documents\NVDA\4_2024-04-09' --> 'data\processed_data\NVDA\4_2024-04-09.md'
Converted 'data\edgar_documents\NVDA\4_2024-04-10' --> 'data\processed_data\NVDA\4_2024-04-10.md'


2025-11-14 17:24:19,149 - INFO - Finished converting document 4_2024-05-29 in 0.03 sec.
2025-11-14 17:24:19,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,191 - INFO - Going to convert document batch...
2025-11-14 17:24:19,192 - INFO - Processing document 4_2024-05-30
2025-11-14 17:24:19,212 - INFO - Finished converting document 4_2024-05-30 in 0.03 sec.
2025-11-14 17:24:19,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,260 - INFO - Going to convert document batch...
2025-11-14 17:24:19,261 - INFO - Processing document 4_2024-05-31
2025-11-14 17:24:19,285 - INFO - Finished converting document 4_2024-05-31 in 0.05 sec.
2025-11-14 17:24:19,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,342 - INFO - Going to convert document batch...
2025-11-14 17:24:19,343 - INFO - Processing document 4_2024-06-05


Converted 'data\edgar_documents\NVDA\4_2024-05-29' --> 'data\processed_data\NVDA\4_2024-05-29.md'
Converted 'data\edgar_documents\NVDA\4_2024-05-30' --> 'data\processed_data\NVDA\4_2024-05-30.md'
Converted 'data\edgar_documents\NVDA\4_2024-05-31' --> 'data\processed_data\NVDA\4_2024-05-31.md'


2025-11-14 17:24:19,401 - INFO - Finished converting document 4_2024-06-05 in 0.09 sec.
2025-11-14 17:24:19,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,473 - INFO - Going to convert document batch...
2025-11-14 17:24:19,474 - INFO - Processing document 4_2024-06-07
2025-11-14 17:24:19,498 - INFO - Finished converting document 4_2024-06-07 in 0.05 sec.
2025-11-14 17:24:19,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,576 - INFO - Going to convert document batch...
2025-11-14 17:24:19,577 - INFO - Processing document 4_2024-06-10
2025-11-14 17:24:19,607 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2024-06-05' --> 'data\processed_data\NVDA\4_2024-06-05.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-07' --> 'data\processed_data\NVDA\4_2024-06-07.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-10' --> 'data\processed_data\NVDA\4_2024-06-10.md'


2025-11-14 17:24:19,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,671 - INFO - Going to convert document batch...
2025-11-14 17:24:19,672 - INFO - Processing document 4_2024-06-13
2025-11-14 17:24:19,717 - INFO - Finished converting document 4_2024-06-13 in 0.08 sec.
2025-11-14 17:24:19,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,769 - INFO - Going to convert document batch...
2025-11-14 17:24:19,770 - INFO - Processing document 4_2024-06-17
2025-11-14 17:24:19,809 - INFO - Finished converting document 4_2024-06-17 in 0.08 sec.
2025-11-14 17:24:19,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:19,865 - INFO - Going to convert document batch...
2025-11-14 17:24:19,865 - INFO - Processing document 4_2024-06-20
2025-11-14 17:24:19,887 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 17:24:19,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2024-06-13' --> 'data\processed_data\NVDA\4_2024-06-13.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-17' --> 'data\processed_data\NVDA\4_2024-06-17.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-20' --> 'data\processed_data\NVDA\4_2024-06-20.md'


2025-11-14 17:24:19,951 - INFO - Going to convert document batch...
2025-11-14 17:24:19,952 - INFO - Processing document 4_2024-06-21
2025-11-14 17:24:20,017 - INFO - Finished converting document 4_2024-06-21 in 0.11 sec.
2025-11-14 17:24:20,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,109 - INFO - Going to convert document batch...
2025-11-14 17:24:20,110 - INFO - Processing document 4_2024-06-26
2025-11-14 17:24:20,126 - INFO - Finished converting document 4_2024-06-26 in 0.05 sec.
2025-11-14 17:24:20,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,174 - INFO - Going to convert document batch...
2025-11-14 17:24:20,175 - INFO - Processing document 4_2024-06-28
2025-11-14 17:24:20,214 - INFO - Finished converting document 4_2024-06-28 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2024-06-21' --> 'data\processed_data\NVDA\4_2024-06-21.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-26' --> 'data\processed_data\NVDA\4_2024-06-26.md'
Converted 'data\edgar_documents\NVDA\4_2024-06-28' --> 'data\processed_data\NVDA\4_2024-06-28.md'


2025-11-14 17:24:20,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,289 - INFO - Going to convert document batch...
2025-11-14 17:24:20,290 - INFO - Processing document 4_2024-07-01
2025-11-14 17:24:20,309 - INFO - Finished converting document 4_2024-07-01 in 0.06 sec.
2025-11-14 17:24:20,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,365 - INFO - Going to convert document batch...
2025-11-14 17:24:20,366 - INFO - Processing document 4_2024-07-02
2025-11-14 17:24:20,409 - INFO - Finished converting document 4_2024-07-02 in 0.08 sec.
2025-11-14 17:24:20,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,472 - INFO - Going to convert document batch...
2025-11-14 17:24:20,473 - INFO - Processing document 4_2024-07-05
2025-11-14 17:24:20,510 - INFO - Finished converting document 4_2024-07-05 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2024-07-01' --> 'data\processed_data\NVDA\4_2024-07-01.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-02' --> 'data\processed_data\NVDA\4_2024-07-02.md'


2025-11-14 17:24:20,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,569 - INFO - Going to convert document batch...
2025-11-14 17:24:20,569 - INFO - Processing document 4_2024-07-09
2025-11-14 17:24:20,606 - INFO - Finished converting document 4_2024-07-09 in 0.06 sec.
2025-11-14 17:24:20,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,668 - INFO - Going to convert document batch...
2025-11-14 17:24:20,670 - INFO - Processing document 4_2024-07-11


Converted 'data\edgar_documents\NVDA\4_2024-07-05' --> 'data\processed_data\NVDA\4_2024-07-05.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-09' --> 'data\processed_data\NVDA\4_2024-07-09.md'


2025-11-14 17:24:20,732 - INFO - Finished converting document 4_2024-07-11 in 0.09 sec.
2025-11-14 17:24:20,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,800 - INFO - Going to convert document batch...
2025-11-14 17:24:20,801 - INFO - Processing document 4_2024-07-15
2025-11-14 17:24:20,820 - INFO - Finished converting document 4_2024-07-15 in 0.05 sec.
2025-11-14 17:24:20,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,869 - INFO - Going to convert document batch...
2025-11-14 17:24:20,869 - INFO - Processing document 4_2024-07-17
2025-11-14 17:24:20,908 - INFO - Finished converting document 4_2024-07-17 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2024-07-11' --> 'data\processed_data\NVDA\4_2024-07-11.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-15' --> 'data\processed_data\NVDA\4_2024-07-15.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-17' --> 'data\processed_data\NVDA\4_2024-07-17.md'


2025-11-14 17:24:20,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:20,981 - INFO - Going to convert document batch...
2025-11-14 17:24:20,981 - INFO - Processing document 4_2024-07-18
2025-11-14 17:24:21,003 - INFO - Finished converting document 4_2024-07-18 in 0.06 sec.
2025-11-14 17:24:21,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,058 - INFO - Going to convert document batch...
2025-11-14 17:24:21,059 - INFO - Processing document 4_2024-07-19
2025-11-14 17:24:21,101 - INFO - Finished converting document 4_2024-07-19 in 0.06 sec.
2025-11-14 17:24:21,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,172 - INFO - Going to convert document batch...
2025-11-14 17:24:21,172 - INFO - Processing document 4_2024-07-23
2025-11-14 17:24:21,211 - INFO - Finished converting document 4_2024-07-23 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2024-07-18' --> 'data\processed_data\NVDA\4_2024-07-18.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-19' --> 'data\processed_data\NVDA\4_2024-07-19.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-23' --> 'data\processed_data\NVDA\4_2024-07-23.md'


2025-11-14 17:24:21,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,272 - INFO - Going to convert document batch...
2025-11-14 17:24:21,273 - INFO - Processing document 4_2024-07-25
2025-11-14 17:24:21,339 - INFO - Finished converting document 4_2024-07-25 in 0.11 sec.
2025-11-14 17:24:21,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,409 - INFO - Going to convert document batch...
2025-11-14 17:24:21,410 - INFO - Processing document 4_2024-07-29
2025-11-14 17:24:21,455 - INFO - Finished converting document 4_2024-07-29 in 0.08 sec.
2025-11-14 17:24:21,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,524 - INFO - Going to convert document batch...
2025-11-14 17:24:21,525 - INFO - Processing document 4_2024-07-31
2025-11-14 17:24:21,571 - INFO - Finished converting document 4_2024-07-31 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2024-07-25' --> 'data\processed_data\NVDA\4_2024-07-25.md'
Converted 'data\edgar_documents\NVDA\4_2024-07-29' --> 'data\processed_data\NVDA\4_2024-07-29.md'


2025-11-14 17:24:21,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:21,646 - INFO - Going to convert document batch...
2025-11-14 17:24:21,648 - INFO - Processing document 4_2024-08-02
2025-11-14 17:24:21,713 - INFO - Finished converting document 4_2024-08-02 in 0.09 sec.
2025-11-14 17:24:21,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2024-07-31' --> 'data\processed_data\NVDA\4_2024-07-31.md'
Converted 'data\edgar_documents\NVDA\4_2024-08-02' --> 'data\processed_data\NVDA\4_2024-08-02.md'


2025-11-14 17:24:22,000 - INFO - Going to convert document batch...
2025-11-14 17:24:22,001 - INFO - Processing document 4_2024-08-06
2025-11-14 17:24:22,059 - INFO - Finished converting document 4_2024-08-06 in 0.30 sec.
2025-11-14 17:24:22,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,148 - INFO - Going to convert document batch...
2025-11-14 17:24:22,149 - INFO - Processing document 4_2024-08-08
2025-11-14 17:24:22,199 - INFO - Finished converting document 4_2024-08-08 in 0.09 sec.
2025-11-14 17:24:22,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,293 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2024-08-06' --> 'data\processed_data\NVDA\4_2024-08-06.md'
Converted 'data\edgar_documents\NVDA\4_2024-08-08' --> 'data\processed_data\NVDA\4_2024-08-08.md'


2025-11-14 17:24:22,294 - INFO - Processing document 4_2024-08-12
2025-11-14 17:24:22,335 - INFO - Finished converting document 4_2024-08-12 in 0.09 sec.
2025-11-14 17:24:22,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,420 - INFO - Going to convert document batch...
2025-11-14 17:24:22,421 - INFO - Processing document 4_2024-09-04
2025-11-14 17:24:22,470 - INFO - Finished converting document 4_2024-09-04 in 0.09 sec.
2025-11-14 17:24:22,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,549 - INFO - Going to convert document batch...
2025-11-14 17:24:22,549 - INFO - Processing document 4_2024-09-06


Converted 'data\edgar_documents\NVDA\4_2024-08-12' --> 'data\processed_data\NVDA\4_2024-08-12.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-04' --> 'data\processed_data\NVDA\4_2024-09-04.md'


2025-11-14 17:24:22,590 - INFO - Finished converting document 4_2024-09-06 in 0.09 sec.
2025-11-14 17:24:22,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,681 - INFO - Going to convert document batch...
2025-11-14 17:24:22,682 - INFO - Processing document 4_2024-09-10
2025-11-14 17:24:22,724 - INFO - Finished converting document 4_2024-09-10 in 0.08 sec.
2025-11-14 17:24:22,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,790 - INFO - Going to convert document batch...
2025-11-14 17:24:22,792 - INFO - Processing document 4_2024-09-12
2025-11-14 17:24:22,838 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.


Converted 'data\edgar_documents\NVDA\4_2024-09-06' --> 'data\processed_data\NVDA\4_2024-09-06.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-10' --> 'data\processed_data\NVDA\4_2024-09-10.md'


2025-11-14 17:24:22,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,907 - INFO - Going to convert document batch...
2025-11-14 17:24:22,908 - INFO - Processing document 4_2024-09-16
2025-11-14 17:24:22,943 - INFO - Finished converting document 4_2024-09-16 in 0.06 sec.
2025-11-14 17:24:22,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:22,998 - INFO - Going to convert document batch...
2025-11-14 17:24:22,999 - INFO - Processing document 4_2024-09-20
2025-11-14 17:24:23,022 - INFO - Finished converting document 4_2024-09-20 in 0.05 sec.
2025-11-14 17:24:23,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,064 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2024-09-12' --> 'data\processed_data\NVDA\4_2024-09-12.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-16' --> 'data\processed_data\NVDA\4_2024-09-16.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-20' --> 'data\processed_data\NVDA\4_2024-09-20.md'


2025-11-14 17:24:23,065 - INFO - Processing document 4_2024-09-23
2025-11-14 17:24:23,090 - INFO - Finished converting document 4_2024-09-23 in 0.05 sec.
2025-11-14 17:24:23,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,160 - INFO - Going to convert document batch...
2025-11-14 17:24:23,161 - INFO - Processing document 4_2024-09-24
2025-11-14 17:24:23,186 - INFO - Finished converting document 4_2024-09-24 in 0.06 sec.
2025-11-14 17:24:23,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,228 - INFO - Going to convert document batch...
2025-11-14 17:24:23,229 - INFO - Processing document 4_2024-09-26
2025-11-14 17:24:23,248 - INFO - Finished converting document 4_2024-09-26 in 0.05 sec.
2025-11-14 17:24:23,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,313 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2024-09-23' --> 'data\processed_data\NVDA\4_2024-09-23.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-24' --> 'data\processed_data\NVDA\4_2024-09-24.md'
Converted 'data\edgar_documents\NVDA\4_2024-09-26' --> 'data\processed_data\NVDA\4_2024-09-26.md'


2025-11-14 17:24:23,314 - INFO - Processing document 4_2024-10-01
2025-11-14 17:24:23,335 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 17:24:23,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,382 - INFO - Going to convert document batch...
2025-11-14 17:24:23,383 - INFO - Processing document 4_2024-10-07
2025-11-14 17:24:23,405 - INFO - Finished converting document 4_2024-10-07 in 0.05 sec.
2025-11-14 17:24:23,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,466 - INFO - Going to convert document batch...
2025-11-14 17:24:23,466 - INFO - Processing document 4_2024-10-11
2025-11-14 17:24:23,485 - INFO - Finished converting document 4_2024-10-11 in 0.06 sec.
2025-11-14 17:24:23,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,526 - INFO - Going to convert document batch...
2025-11-14 17:24:23,527 - INFO - Processing document 4_2024-11-27


Converted 'data\edgar_documents\NVDA\4_2024-10-01' --> 'data\processed_data\NVDA\4_2024-10-01.md'
Converted 'data\edgar_documents\NVDA\4_2024-10-07' --> 'data\processed_data\NVDA\4_2024-10-07.md'
Converted 'data\edgar_documents\NVDA\4_2024-10-11' --> 'data\processed_data\NVDA\4_2024-10-11.md'


2025-11-14 17:24:23,545 - INFO - Finished converting document 4_2024-11-27 in 0.05 sec.
2025-11-14 17:24:23,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,586 - INFO - Going to convert document batch...
2025-11-14 17:24:23,586 - INFO - Processing document 4_2024-12-09
2025-11-14 17:24:23,616 - INFO - Finished converting document 4_2024-12-09 in 0.05 sec.
2025-11-14 17:24:23,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,704 - INFO - Going to convert document batch...
2025-11-14 17:24:23,705 - INFO - Processing document 4_2024-12-13
2025-11-14 17:24:23,737 - INFO - Finished converting document 4_2024-12-13 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2024-11-27' --> 'data\processed_data\NVDA\4_2024-11-27.md'
Converted 'data\edgar_documents\NVDA\4_2024-12-09' --> 'data\processed_data\NVDA\4_2024-12-09.md'
Converted 'data\edgar_documents\NVDA\4_2024-12-13' --> 'data\processed_data\NVDA\4_2024-12-13.md'


2025-11-14 17:24:23,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,812 - INFO - Going to convert document batch...
2025-11-14 17:24:23,813 - INFO - Processing document 4_2024-12-18
2025-11-14 17:24:23,841 - INFO - Finished converting document 4_2024-12-18 in 0.08 sec.
2025-11-14 17:24:23,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,888 - INFO - Going to convert document batch...
2025-11-14 17:24:23,889 - INFO - Processing document 4_2024-12-20
2025-11-14 17:24:23,909 - INFO - Finished converting document 4_2024-12-20 in 0.05 sec.
2025-11-14 17:24:23,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:23,956 - INFO - Going to convert document batch...
2025-11-14 17:24:23,957 - INFO - Processing document 4_2025-01-08
2025-11-14 17:24:23,986 - INFO - Finished converting document 4_2025-01-08 in 0.06 sec.
2025-11-14 17:24:24,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2024-12-18' --> 'data\processed_data\NVDA\4_2024-12-18.md'
Converted 'data\edgar_documents\NVDA\4_2024-12-20' --> 'data\processed_data\NVDA\4_2024-12-20.md'
Converted 'data\edgar_documents\NVDA\4_2025-01-08' --> 'data\processed_data\NVDA\4_2025-01-08.md'


2025-11-14 17:24:24,048 - INFO - Going to convert document batch...
2025-11-14 17:24:24,050 - INFO - Processing document 4_2025-03-04
2025-11-14 17:24:24,073 - INFO - Finished converting document 4_2025-03-04 in 0.06 sec.
2025-11-14 17:24:24,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,139 - INFO - Going to convert document batch...
2025-11-14 17:24:24,141 - INFO - Processing document 4_2025-03-05
2025-11-14 17:24:24,171 - INFO - Finished converting document 4_2025-03-05 in 0.08 sec.
2025-11-14 17:24:24,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,216 - INFO - Going to convert document batch...
2025-11-14 17:24:24,217 - INFO - Processing document 4_2025-03-12
2025-11-14 17:24:24,239 - INFO - Finished converting document 4_2025-03-12 in 0.05 sec.
2025-11-14 17:24:24,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2025-03-04' --> 'data\processed_data\NVDA\4_2025-03-04.md'
Converted 'data\edgar_documents\NVDA\4_2025-03-05' --> 'data\processed_data\NVDA\4_2025-03-05.md'
Converted 'data\edgar_documents\NVDA\4_2025-03-12' --> 'data\processed_data\NVDA\4_2025-03-12.md'


2025-11-14 17:24:24,300 - INFO - Going to convert document batch...
2025-11-14 17:24:24,301 - INFO - Processing document 4_2025-03-17
2025-11-14 17:24:24,318 - INFO - Finished converting document 4_2025-03-17 in 0.06 sec.
2025-11-14 17:24:24,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,358 - INFO - Going to convert document batch...
2025-11-14 17:24:24,358 - INFO - Processing document 4_2025-03-21
2025-11-14 17:24:24,379 - INFO - Finished converting document 4_2025-03-21 in 0.03 sec.
2025-11-14 17:24:24,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,421 - INFO - Going to convert document batch...
2025-11-14 17:24:24,421 - INFO - Processing document 4_2025-03-25
2025-11-14 17:24:24,441 - INFO - Finished converting document 4_2025-03-25 in 0.05 sec.
2025-11-14 17:24:24,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,485 - INFO - Going to convert document batch...
2025-11-14 17:24:24,486 - 

Converted 'data\edgar_documents\NVDA\4_2025-03-17' --> 'data\processed_data\NVDA\4_2025-03-17.md'
Converted 'data\edgar_documents\NVDA\4_2025-03-21' --> 'data\processed_data\NVDA\4_2025-03-21.md'
Converted 'data\edgar_documents\NVDA\4_2025-03-25' --> 'data\processed_data\NVDA\4_2025-03-25.md'
Converted 'data\edgar_documents\NVDA\4_2025-06-03' --> 'data\processed_data\NVDA\4_2025-06-03.md'


2025-11-14 17:24:24,546 - INFO - Going to convert document batch...
2025-11-14 17:24:24,546 - INFO - Processing document 4_2025-06-04
2025-11-14 17:24:24,575 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 17:24:24,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,639 - INFO - Going to convert document batch...
2025-11-14 17:24:24,641 - INFO - Processing document 4_2025-06-10
2025-11-14 17:24:24,665 - INFO - Finished converting document 4_2025-06-10 in 0.05 sec.
2025-11-14 17:24:24,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,706 - INFO - Going to convert document batch...
2025-11-14 17:24:24,707 - INFO - Processing document 4_2025-06-23
2025-11-14 17:24:24,725 - INFO - Finished converting document 4_2025-06-23 in 0.03 sec.
2025-11-14 17:24:24,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,774 - INFO - Going to convert document batch...
2025-11-14 17:24:24,775 - 

Converted 'data\edgar_documents\NVDA\4_2025-06-04' --> 'data\processed_data\NVDA\4_2025-06-04.md'
Converted 'data\edgar_documents\NVDA\4_2025-06-10' --> 'data\processed_data\NVDA\4_2025-06-10.md'
Converted 'data\edgar_documents\NVDA\4_2025-06-23' --> 'data\processed_data\NVDA\4_2025-06-23.md'


2025-11-14 17:24:24,813 - INFO - Finished converting document 4_2025-06-24 in 0.06 sec.
2025-11-14 17:24:24,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:24,890 - INFO - Going to convert document batch...
2025-11-14 17:24:24,891 - INFO - Processing document 4_2025-06-26
2025-11-14 17:24:24,935 - INFO - Finished converting document 4_2025-06-26 in 0.09 sec.
2025-11-14 17:24:25,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,016 - INFO - Going to convert document batch...
2025-11-14 17:24:25,017 - INFO - Processing document 4_2025-06-27
2025-11-14 17:24:25,043 - INFO - Finished converting document 4_2025-06-27 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2025-06-24' --> 'data\processed_data\NVDA\4_2025-06-24.md'
Converted 'data\edgar_documents\NVDA\4_2025-06-26' --> 'data\processed_data\NVDA\4_2025-06-26.md'


2025-11-14 17:24:25,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,104 - INFO - Going to convert document batch...
2025-11-14 17:24:25,108 - INFO - Processing document 4_2025-06-30
2025-11-14 17:24:25,155 - INFO - Finished converting document 4_2025-06-30 in 0.09 sec.
2025-11-14 17:24:25,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,207 - INFO - Going to convert document batch...
2025-11-14 17:24:25,207 - INFO - Processing document 4_2025-07-01


Converted 'data\edgar_documents\NVDA\4_2025-06-27' --> 'data\processed_data\NVDA\4_2025-06-27.md'
Converted 'data\edgar_documents\NVDA\4_2025-06-30' --> 'data\processed_data\NVDA\4_2025-06-30.md'


2025-11-14 17:24:25,465 - INFO - Finished converting document 4_2025-07-01 in 0.30 sec.
2025-11-14 17:24:25,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,527 - INFO - Going to convert document batch...
2025-11-14 17:24:25,528 - INFO - Processing document 4_2025-07-07
2025-11-14 17:24:25,577 - INFO - Finished converting document 4_2025-07-07 in 0.08 sec.
2025-11-14 17:24:25,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,659 - INFO - Going to convert document batch...
2025-11-14 17:24:25,660 - INFO - Processing document 4_2025-07-10
2025-11-14 17:24:25,698 - INFO - Finished converting document 4_2025-07-10 in 0.08 sec.


Converted 'data\edgar_documents\NVDA\4_2025-07-01' --> 'data\processed_data\NVDA\4_2025-07-01.md'
Converted 'data\edgar_documents\NVDA\4_2025-07-07' --> 'data\processed_data\NVDA\4_2025-07-07.md'


2025-11-14 17:24:25,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,761 - INFO - Going to convert document batch...
2025-11-14 17:24:25,761 - INFO - Processing document 4_2025-07-15
2025-11-14 17:24:25,799 - INFO - Finished converting document 4_2025-07-15 in 0.06 sec.
2025-11-14 17:24:25,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:25,862 - INFO - Going to convert document batch...
2025-11-14 17:24:25,863 - INFO - Processing document 4_2025-07-17
2025-11-14 17:24:25,896 - INFO - Finished converting document 4_2025-07-17 in 0.06 sec.
2025-11-14 17:24:25,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\4_2025-07-10' --> 'data\processed_data\NVDA\4_2025-07-10.md'
Converted 'data\edgar_documents\NVDA\4_2025-07-15' --> 'data\processed_data\NVDA\4_2025-07-15.md'
Converted 'data\edgar_documents\NVDA\4_2025-07-17' --> 'data\processed_data\NVDA\4_2025-07-17.md'


2025-11-14 17:24:25,952 - INFO - Going to convert document batch...
2025-11-14 17:24:25,952 - INFO - Processing document 4_2025-07-18
2025-11-14 17:24:25,994 - INFO - Finished converting document 4_2025-07-18 in 0.08 sec.
2025-11-14 17:24:26,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,091 - INFO - Going to convert document batch...
2025-11-14 17:24:26,092 - INFO - Processing document 4_2025-07-23
2025-11-14 17:24:26,138 - INFO - Finished converting document 4_2025-07-23 in 0.09 sec.
2025-11-14 17:24:26,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,205 - INFO - Going to convert document batch...
2025-11-14 17:24:26,206 - INFO - Processing document 4_2025-07-28
2025-11-14 17:24:26,243 - INFO - Finished converting document 4_2025-07-28 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2025-07-18' --> 'data\processed_data\NVDA\4_2025-07-18.md'
Converted 'data\edgar_documents\NVDA\4_2025-07-23' --> 'data\processed_data\NVDA\4_2025-07-23.md'


2025-11-14 17:24:26,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,324 - INFO - Going to convert document batch...
2025-11-14 17:24:26,324 - INFO - Processing document 4_2025-07-31
2025-11-14 17:24:26,376 - INFO - Finished converting document 4_2025-07-31 in 0.09 sec.
2025-11-14 17:24:26,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,481 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2025-07-28' --> 'data\processed_data\NVDA\4_2025-07-28.md'
Converted 'data\edgar_documents\NVDA\4_2025-07-31' --> 'data\processed_data\NVDA\4_2025-07-31.md'


2025-11-14 17:24:26,482 - INFO - Processing document 4_2025-08-05
2025-11-14 17:24:26,555 - INFO - Finished converting document 4_2025-08-05 in 0.12 sec.
2025-11-14 17:24:26,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,649 - INFO - Going to convert document batch...
2025-11-14 17:24:26,650 - INFO - Processing document 4_2025-08-06
2025-11-14 17:24:26,696 - INFO - Finished converting document 4_2025-08-06 in 0.08 sec.
2025-11-14 17:24:26,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,779 - INFO - Going to convert document batch...
2025-11-14 17:24:26,779 - INFO - Processing document 4_2025-08-08


Converted 'data\edgar_documents\NVDA\4_2025-08-05' --> 'data\processed_data\NVDA\4_2025-08-05.md'
Converted 'data\edgar_documents\NVDA\4_2025-08-06' --> 'data\processed_data\NVDA\4_2025-08-06.md'


2025-11-14 17:24:26,821 - INFO - Finished converting document 4_2025-08-08 in 0.08 sec.
2025-11-14 17:24:26,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:26,893 - INFO - Going to convert document batch...
2025-11-14 17:24:26,894 - INFO - Processing document 4_2025-08-13
2025-11-14 17:24:26,964 - INFO - Finished converting document 4_2025-08-13 in 0.11 sec.
2025-11-14 17:24:27,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,035 - INFO - Going to convert document batch...
2025-11-14 17:24:27,036 - INFO - Processing document 4_2025-08-18


Converted 'data\edgar_documents\NVDA\4_2025-08-08' --> 'data\processed_data\NVDA\4_2025-08-08.md'
Converted 'data\edgar_documents\NVDA\4_2025-08-13' --> 'data\processed_data\NVDA\4_2025-08-13.md'


2025-11-14 17:24:27,074 - INFO - Finished converting document 4_2025-08-18 in 0.08 sec.
2025-11-14 17:24:27,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,129 - INFO - Going to convert document batch...
2025-11-14 17:24:27,129 - INFO - Processing document 4_2025-09-03
2025-11-14 17:24:27,154 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:24:27,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,220 - INFO - Going to convert document batch...
2025-11-14 17:24:27,221 - INFO - Processing document 4_2025-09-04
2025-11-14 17:24:27,252 - INFO - Finished converting document 4_2025-09-04 in 0.08 sec.
2025-11-14 17:24:27,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,302 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2025-08-18' --> 'data\processed_data\NVDA\4_2025-08-18.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-03' --> 'data\processed_data\NVDA\4_2025-09-03.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-04' --> 'data\processed_data\NVDA\4_2025-09-04.md'


2025-11-14 17:24:27,303 - INFO - Processing document 4_2025-09-08
2025-11-14 17:24:27,345 - INFO - Finished converting document 4_2025-09-08 in 0.08 sec.
2025-11-14 17:24:27,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,421 - INFO - Going to convert document batch...
2025-11-14 17:24:27,422 - INFO - Processing document 4_2025-09-10
2025-11-14 17:24:27,457 - INFO - Finished converting document 4_2025-09-10 in 0.08 sec.
2025-11-14 17:24:27,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,509 - INFO - Going to convert document batch...
2025-11-14 17:24:27,510 - INFO - Processing document 4_2025-09-11
2025-11-14 17:24:27,554 - INFO - Finished converting document 4_2025-09-11 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2025-09-08' --> 'data\processed_data\NVDA\4_2025-09-08.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-10' --> 'data\processed_data\NVDA\4_2025-09-10.md'


2025-11-14 17:24:27,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,614 - INFO - Going to convert document batch...
2025-11-14 17:24:27,616 - INFO - Processing document 4_2025-09-15
2025-11-14 17:24:27,638 - INFO - Finished converting document 4_2025-09-15 in 0.05 sec.
2025-11-14 17:24:27,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,687 - INFO - Going to convert document batch...
2025-11-14 17:24:27,688 - INFO - Processing document 4_2025-09-16
2025-11-14 17:24:27,710 - INFO - Finished converting document 4_2025-09-16 in 0.05 sec.
2025-11-14 17:24:27,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,770 - INFO - Going to convert document batch...
2025-11-14 17:24:27,771 - INFO - Processing document 4_2025-09-19


Converted 'data\edgar_documents\NVDA\4_2025-09-11' --> 'data\processed_data\NVDA\4_2025-09-11.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-15' --> 'data\processed_data\NVDA\4_2025-09-15.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-16' --> 'data\processed_data\NVDA\4_2025-09-16.md'


2025-11-14 17:24:27,794 - INFO - Finished converting document 4_2025-09-19 in 0.06 sec.
2025-11-14 17:24:27,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,844 - INFO - Going to convert document batch...
2025-11-14 17:24:27,845 - INFO - Processing document 4_2025-09-22
2025-11-14 17:24:27,883 - INFO - Finished converting document 4_2025-09-22 in 0.06 sec.
2025-11-14 17:24:27,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:27,933 - INFO - Going to convert document batch...
2025-11-14 17:24:27,933 - INFO - Processing document 4_2025-09-23
2025-11-14 17:24:27,954 - INFO - Finished converting document 4_2025-09-23 in 0.05 sec.
2025-11-14 17:24:27,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,010 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2025-09-19' --> 'data\processed_data\NVDA\4_2025-09-19.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-22' --> 'data\processed_data\NVDA\4_2025-09-22.md'
Converted 'data\edgar_documents\NVDA\4_2025-09-23' --> 'data\processed_data\NVDA\4_2025-09-23.md'


2025-11-14 17:24:28,011 - INFO - Processing document 4_2025-09-24
2025-11-14 17:24:28,072 - INFO - Finished converting document 4_2025-09-24 in 0.09 sec.
2025-11-14 17:24:28,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,169 - INFO - Going to convert document batch...
2025-11-14 17:24:28,170 - INFO - Processing document 4_2025-09-29


Converted 'data\edgar_documents\NVDA\4_2025-09-24' --> 'data\processed_data\NVDA\4_2025-09-24.md'


2025-11-14 17:24:28,433 - INFO - Finished converting document 4_2025-09-29 in 0.33 sec.
2025-11-14 17:24:28,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,512 - INFO - Going to convert document batch...
2025-11-14 17:24:28,513 - INFO - Processing document 4_2025-10-02
2025-11-14 17:24:28,560 - INFO - Finished converting document 4_2025-10-02 in 0.09 sec.
2025-11-14 17:24:28,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,654 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2025-09-29' --> 'data\processed_data\NVDA\4_2025-09-29.md'
Converted 'data\edgar_documents\NVDA\4_2025-10-02' --> 'data\processed_data\NVDA\4_2025-10-02.md'


2025-11-14 17:24:28,655 - INFO - Processing document 4_2025-10-07
2025-11-14 17:24:28,709 - INFO - Finished converting document 4_2025-10-07 in 0.11 sec.
2025-11-14 17:24:28,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,795 - INFO - Going to convert document batch...
2025-11-14 17:24:28,796 - INFO - Processing document 4_2025-10-10
2025-11-14 17:24:28,852 - INFO - Finished converting document 4_2025-10-10 in 0.08 sec.
2025-11-14 17:24:28,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:28,953 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\NVDA\4_2025-10-07' --> 'data\processed_data\NVDA\4_2025-10-07.md'
Converted 'data\edgar_documents\NVDA\4_2025-10-10' --> 'data\processed_data\NVDA\4_2025-10-10.md'


2025-11-14 17:24:28,954 - INFO - Processing document 4_2025-10-15
2025-11-14 17:24:29,006 - INFO - Finished converting document 4_2025-10-15 in 0.11 sec.
2025-11-14 17:24:29,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,082 - INFO - Going to convert document batch...
2025-11-14 17:24:29,083 - INFO - Processing document 4_2025-10-20
2025-11-14 17:24:29,126 - INFO - Finished converting document 4_2025-10-20 in 0.08 sec.
2025-11-14 17:24:29,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,190 - INFO - Going to convert document batch...
2025-11-14 17:24:29,190 - INFO - Processing document 4_2025-10-23
2025-11-14 17:24:29,222 - INFO - Finished converting document 4_2025-10-23 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\4_2025-10-15' --> 'data\processed_data\NVDA\4_2025-10-15.md'
Converted 'data\edgar_documents\NVDA\4_2025-10-20' --> 'data\processed_data\NVDA\4_2025-10-20.md'
Converted 'data\edgar_documents\NVDA\4_2025-10-23' --> 'data\processed_data\NVDA\4_2025-10-23.md'


2025-11-14 17:24:29,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,306 - INFO - Going to convert document batch...
2025-11-14 17:24:29,307 - INFO - Processing document 4_2025-10-28
2025-11-14 17:24:29,400 - INFO - Finished converting document 4_2025-10-28 in 0.14 sec.
2025-11-14 17:24:29,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,474 - INFO - Going to convert document batch...
2025-11-14 17:24:29,475 - INFO - Processing document 4_2025-10-31
2025-11-14 17:24:29,511 - INFO - Finished converting document 4_2025-10-31 in 0.06 sec.
2025-11-14 17:24:29,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,594 - INFO - Going to convert document batch...
2025-11-14 17:24:29,595 - INFO - Processing document 4_2025-11-05
2025-11-14 17:24:29,639 - INFO - Finished converting document 4_2025-11-05 in 0.09 sec.


Converted 'data\edgar_documents\NVDA\4_2025-10-28' --> 'data\processed_data\NVDA\4_2025-10-28.md'
Converted 'data\edgar_documents\NVDA\4_2025-10-31' --> 'data\processed_data\NVDA\4_2025-10-31.md'


2025-11-14 17:24:29,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,696 - INFO - Going to convert document batch...
2025-11-14 17:24:29,697 - INFO - Processing document 8-K_2023-02-22
2025-11-14 17:24:29,711 - INFO - Finished converting document 8-K_2023-02-22 in 0.03 sec.
2025-11-14 17:24:29,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,753 - INFO - Going to convert document batch...
2025-11-14 17:24:29,754 - INFO - Processing document 8-K_2023-03-08
2025-11-14 17:24:29,794 - INFO - Finished converting document 8-K_2023-03-08 in 0.08 sec.
2025-11-14 17:24:29,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,837 - INFO - Going to convert document batch...
2025-11-14 17:24:29,838 - INFO - Processing document 8-K_2023-05-24
2025-11-14 17:24:29,852 - INFO - Finished converting document 8-K_2023-05-24 in 0.03 sec.


Converted 'data\edgar_documents\NVDA\4_2025-11-05' --> 'data\processed_data\NVDA\4_2025-11-05.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-02-22' --> 'data\processed_data\NVDA\8-K_2023-02-22.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-03-08' --> 'data\processed_data\NVDA\8-K_2023-03-08.md'


2025-11-14 17:24:29,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,893 - INFO - Going to convert document batch...
2025-11-14 17:24:29,894 - INFO - Processing document 8-K_2023-06-27
2025-11-14 17:24:29,930 - INFO - Finished converting document 8-K_2023-06-27 in 0.06 sec.
2025-11-14 17:24:29,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:29,973 - INFO - Going to convert document batch...
2025-11-14 17:24:29,974 - INFO - Processing document 8-K_2023-07-24
2025-11-14 17:24:29,986 - INFO - Finished converting document 8-K_2023-07-24 in 0.05 sec.
2025-11-14 17:24:30,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,014 - INFO - Going to convert document batch...
2025-11-14 17:24:30,015 - INFO - Processing document 8-K_2023-08-23
2025-11-14 17:24:30,027 - INFO - Finished converting document 8-K_2023-08-23 in 0.05 sec.
2025-11-14 17:24:30,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\8-K_2023-05-24' --> 'data\processed_data\NVDA\8-K_2023-05-24.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-06-27' --> 'data\processed_data\NVDA\8-K_2023-06-27.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-07-24' --> 'data\processed_data\NVDA\8-K_2023-07-24.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-08-23' --> 'data\processed_data\NVDA\8-K_2023-08-23.md'


2025-11-14 17:24:30,056 - INFO - Going to convert document batch...
2025-11-14 17:24:30,056 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:24:30,066 - INFO - Finished converting document 8-K_2023-10-17 in 0.03 sec.
2025-11-14 17:24:30,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,095 - INFO - Going to convert document batch...
2025-11-14 17:24:30,096 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:24:30,106 - INFO - Finished converting document 8-K_2023-10-24 in 0.03 sec.
2025-11-14 17:24:30,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,135 - INFO - Going to convert document batch...
2025-11-14 17:24:30,135 - INFO - Processing document 8-K_2023-11-21
2025-11-14 17:24:30,147 - INFO - Finished converting document 8-K_2023-11-21 in 0.03 sec.
2025-11-14 17:24:30,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,173 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NVDA\8-K_2023-10-17' --> 'data\processed_data\NVDA\8-K_2023-10-17.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-10-24' --> 'data\processed_data\NVDA\8-K_2023-10-24.md'
Converted 'data\edgar_documents\NVDA\8-K_2023-11-21' --> 'data\processed_data\NVDA\8-K_2023-11-21.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-02-21' --> 'data\processed_data\NVDA\8-K_2024-02-21.md'


2025-11-14 17:24:30,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,271 - INFO - Going to convert document batch...
2025-11-14 17:24:30,272 - INFO - Processing document 8-K_2024-05-22
2025-11-14 17:24:30,286 - INFO - Finished converting document 8-K_2024-05-22 in 0.03 sec.
2025-11-14 17:24:30,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,335 - INFO - Going to convert document batch...
2025-11-14 17:24:30,335 - INFO - Processing document 8-K_2024-06-07
2025-11-14 17:24:30,349 - INFO - Finished converting document 8-K_2024-06-07 in 0.05 sec.
2025-11-14 17:24:30,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,383 - INFO - Going to convert document batch...
2025-11-14 17:24:30,384 - INFO - Processing document 8-K_2024-07-02
2025-11-14 17:24:30,416 - INFO - Finished converting document 8-K_2024-07-02 in 0.06 sec.


Converted 'data\edgar_documents\NVDA\8-K_2024-03-14' --> 'data\processed_data\NVDA\8-K_2024-03-14.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-05-22' --> 'data\processed_data\NVDA\8-K_2024-05-22.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-06-07' --> 'data\processed_data\NVDA\8-K_2024-06-07.md'


2025-11-14 17:24:30,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,452 - INFO - Going to convert document batch...
2025-11-14 17:24:30,454 - INFO - Processing document 8-K_2024-08-28
2025-11-14 17:24:30,468 - INFO - Finished converting document 8-K_2024-08-28 in 0.03 sec.
2025-11-14 17:24:30,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,495 - INFO - Going to convert document batch...
2025-11-14 17:24:30,496 - INFO - Processing document 8-K_2024-11-07
2025-11-14 17:24:30,507 - INFO - Finished converting document 8-K_2024-11-07 in 0.03 sec.
2025-11-14 17:24:30,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,532 - INFO - Going to convert document batch...
2025-11-14 17:24:30,533 - INFO - Processing document 8-K_2024-11-20
2025-11-14 17:24:30,545 - INFO - Finished converting document 8-K_2024-11-20 in 0.03 sec.
2025-11-14 17:24:30,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\NVDA\8-K_2024-07-02' --> 'data\processed_data\NVDA\8-K_2024-07-02.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-08-28' --> 'data\processed_data\NVDA\8-K_2024-08-28.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-11-07' --> 'data\processed_data\NVDA\8-K_2024-11-07.md'
Converted 'data\edgar_documents\NVDA\8-K_2024-11-20' --> 'data\processed_data\NVDA\8-K_2024-11-20.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-01-17' --> 'data\processed_data\NVDA\8-K_2025-01-17.md'


2025-11-14 17:24:30,636 - INFO - Going to convert document batch...
2025-11-14 17:24:30,637 - INFO - Processing document 8-K_2025-02-26
2025-11-14 17:24:30,650 - INFO - Finished converting document 8-K_2025-02-26 in 0.03 sec.
2025-11-14 17:24:30,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,679 - INFO - Going to convert document batch...
2025-11-14 17:24:30,680 - INFO - Processing document 8-K_2025-03-07
2025-11-14 17:24:30,704 - INFO - Finished converting document 8-K_2025-03-07 in 0.05 sec.
2025-11-14 17:24:30,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,763 - INFO - Going to convert document batch...
2025-11-14 17:24:30,764 - INFO - Processing document 8-K_2025-04-15
2025-11-14 17:24:30,774 - INFO - Finished converting document 8-K_2025-04-15 in 0.05 sec.
2025-11-14 17:24:30,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,798 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\NVDA\8-K_2025-02-26' --> 'data\processed_data\NVDA\8-K_2025-02-26.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-03-07' --> 'data\processed_data\NVDA\8-K_2025-03-07.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-04-15' --> 'data\processed_data\NVDA\8-K_2025-04-15.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-05-28' --> 'data\processed_data\NVDA\8-K_2025-05-28.md'


2025-11-14 17:24:30,852 - INFO - Processing document 8-K_2025-07-01
2025-11-14 17:24:30,893 - INFO - Finished converting document 8-K_2025-07-01 in 0.08 sec.
2025-11-14 17:24:30,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,953 - INFO - Going to convert document batch...
2025-11-14 17:24:30,953 - INFO - Processing document 8-K_2025-08-05
2025-11-14 17:24:30,965 - INFO - Finished converting document 8-K_2025-08-05 in 0.06 sec.
2025-11-14 17:24:30,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:24:30,989 - INFO - Going to convert document batch...
2025-11-14 17:24:30,990 - INFO - Processing document 8-K_2025-08-27
2025-11-14 17:24:31,004 - INFO - Finished converting document 8-K_2025-08-27 in 0.03 sec.
2025-11-14 17:24:31,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\8-K_2025-07-01' --> 'data\processed_data\NVDA\8-K_2025-07-01.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-08-05' --> 'data\processed_data\NVDA\8-K_2025-08-05.md'
Converted 'data\edgar_documents\NVDA\8-K_2025-08-27' --> 'data\processed_data\NVDA\8-K_2025-08-27.md'


2025-11-14 17:24:31,615 - INFO - Going to convert document batch...
2025-11-14 17:24:31,615 - INFO - Processing document DEF-14A_2023-05-08
2025-11-14 17:24:32,711 - INFO - Finished converting document DEF-14A_2023-05-08 in 1.69 sec.
2025-11-14 17:24:33,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\DEF-14A_2023-05-08' --> 'data\processed_data\NVDA\DEF-14A_2023-05-08.md'


2025-11-14 17:24:33,756 - INFO - Going to convert document batch...
2025-11-14 17:24:33,758 - INFO - Processing document DEF-14A_2024-05-14
2025-11-14 17:24:35,009 - INFO - Finished converting document DEF-14A_2024-05-14 in 1.58 sec.
2025-11-14 17:24:35,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\DEF-14A_2024-05-14' --> 'data\processed_data\NVDA\DEF-14A_2024-05-14.md'


2025-11-14 17:24:35,997 - INFO - Going to convert document batch...
2025-11-14 17:24:35,998 - INFO - Processing document DEF-14A_2025-05-13
2025-11-14 17:24:36,930 - INFO - Finished converting document DEF-14A_2025-05-13 in 1.28 sec.
2025-11-14 17:24:37,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\NVDA\DEF-14A_2025-05-13' --> 'data\processed_data\NVDA\DEF-14A_2025-05-13.md'
Processed 187 new files. Errors: 0
Found 132 files to process in data\edgar_documents\ORCL


2025-11-14 17:24:39,590 - INFO - Going to convert document batch...
2025-11-14 17:24:39,591 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:24:39,591 - INFO - Processing document 10-K_2023-06-20
2025-11-14 17:24:43,145 - INFO - Finished converting document 10-K_2023-06-20 in 5.55 sec.
2025-11-14 17:24:43,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-K_2023-06-20' --> 'data\processed_data\ORCL\10-K_2023-06-20.md'


2025-11-14 17:24:45,252 - INFO - Going to convert document batch...
2025-11-14 17:24:45,253 - INFO - Processing document 10-K_2024-06-20
2025-11-14 17:24:48,692 - INFO - Finished converting document 10-K_2024-06-20 in 5.09 sec.
2025-11-14 17:24:49,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-K_2024-06-20' --> 'data\processed_data\ORCL\10-K_2024-06-20.md'


2025-11-14 17:24:51,059 - INFO - Going to convert document batch...
2025-11-14 17:24:51,060 - INFO - Processing document 10-K_2025-06-18
2025-11-14 17:24:54,150 - INFO - Finished converting document 10-K_2025-06-18 in 5.00 sec.
2025-11-14 17:24:54,654 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:24:54,656 - ERROR - Input document 10-Q_2023-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:24:54,663 - INFO - Going to convert d

Converted 'data\edgar_documents\ORCL\10-K_2025-06-18' --> 'data\processed_data\ORCL\10-K_2025-06-18.md'
Error processing data\edgar_documents\ORCL\10-Q_2023-03-10: File format not allowed: data\edgar_documents\ORCL\10-Q_2023-03-10


2025-11-14 17:24:55,716 - INFO - Going to convert document batch...
2025-11-14 17:24:55,716 - INFO - Processing document 10-Q_2023-09-12
2025-11-14 17:24:56,476 - INFO - Finished converting document 10-Q_2023-09-12 in 1.81 sec.
2025-11-14 17:24:56,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2023-09-12' --> 'data\processed_data\ORCL\10-Q_2023-09-12.md'


2025-11-14 17:24:57,388 - INFO - Going to convert document batch...
2025-11-14 17:24:57,389 - INFO - Processing document 10-Q_2023-12-12
2025-11-14 17:24:59,031 - INFO - Finished converting document 10-Q_2023-12-12 in 2.36 sec.
2025-11-14 17:24:59,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2023-12-12' --> 'data\processed_data\ORCL\10-Q_2023-12-12.md'


2025-11-14 17:25:00,001 - INFO - Going to convert document batch...
2025-11-14 17:25:00,002 - INFO - Processing document 10-Q_2024-03-12
2025-11-14 17:25:01,119 - INFO - Finished converting document 10-Q_2024-03-12 in 1.83 sec.
2025-11-14 17:25:01,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2024-03-12' --> 'data\processed_data\ORCL\10-Q_2024-03-12.md'


2025-11-14 17:25:02,291 - INFO - Going to convert document batch...
2025-11-14 17:25:02,291 - INFO - Processing document 10-Q_2024-09-10
2025-11-14 17:25:03,033 - INFO - Finished converting document 10-Q_2024-09-10 in 1.61 sec.
2025-11-14 17:25:03,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2024-09-10' --> 'data\processed_data\ORCL\10-Q_2024-09-10.md'


2025-11-14 17:25:04,406 - INFO - Going to convert document batch...
2025-11-14 17:25:04,406 - INFO - Processing document 10-Q_2024-12-10
2025-11-14 17:25:05,491 - INFO - Finished converting document 10-Q_2024-12-10 in 2.25 sec.
2025-11-14 17:25:05,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2024-12-10' --> 'data\processed_data\ORCL\10-Q_2024-12-10.md'


2025-11-14 17:25:06,865 - INFO - Going to convert document batch...
2025-11-14 17:25:06,866 - INFO - Processing document 10-Q_2025-03-11
2025-11-14 17:25:07,968 - INFO - Finished converting document 10-Q_2025-03-11 in 2.16 sec.
2025-11-14 17:25:08,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\10-Q_2025-03-11' --> 'data\processed_data\ORCL\10-Q_2025-03-11.md'


2025-11-14 17:25:08,811 - INFO - Going to convert document batch...
2025-11-14 17:25:08,811 - INFO - Processing document 10-Q_2025-09-10
2025-11-14 17:25:09,585 - INFO - Finished converting document 10-Q_2025-09-10 in 1.30 sec.
2025-11-14 17:25:09,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:09,802 - INFO - Going to convert document batch...
2025-11-14 17:25:09,803 - INFO - Processing document 4_2023-01-26
2025-11-14 17:25:09,823 - INFO - Finished converting document 4_2023-01-26 in 0.05 sec.
2025-11-14 17:25:09,864 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:09,864 - ERROR - Input document 4_2023-02-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\ORCL\10-Q_2025-09-10' --> 'data\processed_data\ORCL\10-Q_2025-09-10.md'
Converted 'data\edgar_documents\ORCL\4_2023-01-26' --> 'data\processed_data\ORCL\4_2023-01-26.md'
Error processing data\edgar_documents\ORCL\4_2023-02-02: File format not allowed: data\edgar_documents\ORCL\4_2023-02-02
Error processing data\edgar_documents\ORCL\4_2023-02-03: File format not allowed: data\edgar_documents\ORCL\4_2023-02-03
Converted 'data\edgar_documents\ORCL\4_2023-02-06' --> 'data\processed_data\ORCL\4_2023-02-06.md'


2025-11-14 17:25:09,968 - INFO - Processing document 4_2023-03-22
2025-11-14 17:25:09,989 - INFO - Finished converting document 4_2023-03-22 in 0.05 sec.
2025-11-14 17:25:10,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,041 - INFO - Going to convert document batch...
2025-11-14 17:25:10,042 - INFO - Processing document 4_2023-04-04
2025-11-14 17:25:10,080 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 17:25:10,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,142 - INFO - Going to convert document batch...
2025-11-14 17:25:10,143 - INFO - Processing document 4_2023-04-12
2025-11-14 17:25:10,172 - INFO - Finished converting document 4_2023-04-12 in 0.05 sec.


Converted 'data\edgar_documents\ORCL\4_2023-03-22' --> 'data\processed_data\ORCL\4_2023-03-22.md'
Converted 'data\edgar_documents\ORCL\4_2023-04-04' --> 'data\processed_data\ORCL\4_2023-04-04.md'


2025-11-14 17:25:10,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,221 - INFO - Going to convert document batch...
2025-11-14 17:25:10,222 - INFO - Processing document 4_2023-04-13
2025-11-14 17:25:10,248 - INFO - Finished converting document 4_2023-04-13 in 0.05 sec.
2025-11-14 17:25:10,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,298 - INFO - Going to convert document batch...
2025-11-14 17:25:10,299 - INFO - Processing document 4_2023-04-25
2025-11-14 17:25:10,320 - INFO - Finished converting document 4_2023-04-25 in 0.03 sec.
2025-11-14 17:25:10,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,371 - INFO - Going to convert document batch...
2025-11-14 17:25:10,374 - INFO - Processing document 4_2023-06-02
2025-11-14 17:25:10,399 - INFO - Finished converting document 4_2023-06-02 in 0.05 sec.


Converted 'data\edgar_documents\ORCL\4_2023-04-12' --> 'data\processed_data\ORCL\4_2023-04-12.md'
Converted 'data\edgar_documents\ORCL\4_2023-04-13' --> 'data\processed_data\ORCL\4_2023-04-13.md'
Converted 'data\edgar_documents\ORCL\4_2023-04-25' --> 'data\processed_data\ORCL\4_2023-04-25.md'


2025-11-14 17:25:10,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,450 - INFO - Going to convert document batch...
2025-11-14 17:25:10,452 - INFO - Processing document 4_2023-06-16
2025-11-14 17:25:10,478 - INFO - Finished converting document 4_2023-06-16 in 0.05 sec.
2025-11-14 17:25:10,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,563 - INFO - Going to convert document batch...
2025-11-14 17:25:10,564 - INFO - Processing document 4_2023-06-21
2025-11-14 17:25:10,600 - INFO - Finished converting document 4_2023-06-21 in 0.08 sec.


Converted 'data\edgar_documents\ORCL\4_2023-06-02' --> 'data\processed_data\ORCL\4_2023-06-02.md'
Converted 'data\edgar_documents\ORCL\4_2023-06-16' --> 'data\processed_data\ORCL\4_2023-06-16.md'


2025-11-14 17:25:10,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:10,661 - INFO - Going to convert document batch...
2025-11-14 17:25:10,662 - INFO - Processing document 4_2023-06-22


Converted 'data\edgar_documents\ORCL\4_2023-06-21' --> 'data\processed_data\ORCL\4_2023-06-21.md'


2025-11-14 17:25:11,218 - INFO - Finished converting document 4_2023-06-22 in 0.59 sec.
2025-11-14 17:25:11,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,275 - INFO - Going to convert document batch...
2025-11-14 17:25:11,276 - INFO - Processing document 4_2023-06-23
2025-11-14 17:25:11,301 - INFO - Finished converting document 4_2023-06-23 in 0.05 sec.
2025-11-14 17:25:11,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,354 - INFO - Going to convert document batch...
2025-11-14 17:25:11,354 - INFO - Processing document 4_2023-06-29
2025-11-14 17:25:11,376 - INFO - Finished converting document 4_2023-06-29 in 0.05 sec.
2025-11-14 17:25:11,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,420 - INFO - Going to convert document batch...
2025-11-14 17:25:11,420 - INFO - Processing document 4_2023-06-30
2025-11-14 17:25:11,438 - INFO - Finished converting document 4_2023-06-30 in 0.03 sec.


Converted 'data\edgar_documents\ORCL\4_2023-06-22' --> 'data\processed_data\ORCL\4_2023-06-22.md'
Converted 'data\edgar_documents\ORCL\4_2023-06-23' --> 'data\processed_data\ORCL\4_2023-06-23.md'
Converted 'data\edgar_documents\ORCL\4_2023-06-29' --> 'data\processed_data\ORCL\4_2023-06-29.md'


2025-11-14 17:25:11,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,483 - INFO - Going to convert document batch...
2025-11-14 17:25:11,484 - INFO - Processing document 4_2023-07-07
2025-11-14 17:25:11,505 - INFO - Finished converting document 4_2023-07-07 in 0.03 sec.
2025-11-14 17:25:11,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,570 - INFO - Going to convert document batch...
2025-11-14 17:25:11,571 - INFO - Processing document 4_2023-07-28
2025-11-14 17:25:11,596 - INFO - Finished converting document 4_2023-07-28 in 0.06 sec.
2025-11-14 17:25:11,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,642 - INFO - Going to convert document batch...
2025-11-14 17:25:11,643 - INFO - Processing document 4_2023-08-07
2025-11-14 17:25:11,667 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.


Converted 'data\edgar_documents\ORCL\4_2023-06-30' --> 'data\processed_data\ORCL\4_2023-06-30.md'
Converted 'data\edgar_documents\ORCL\4_2023-07-07' --> 'data\processed_data\ORCL\4_2023-07-07.md'
Converted 'data\edgar_documents\ORCL\4_2023-07-28' --> 'data\processed_data\ORCL\4_2023-07-28.md'


2025-11-14 17:25:11,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,709 - INFO - Going to convert document batch...
2025-11-14 17:25:11,710 - INFO - Processing document 4_2023-09-06
2025-11-14 17:25:11,731 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 17:25:11,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,786 - INFO - Going to convert document batch...
2025-11-14 17:25:11,787 - INFO - Processing document 4_2023-09-18
2025-11-14 17:25:11,806 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 17:25:11,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,845 - INFO - Going to convert document batch...
2025-11-14 17:25:11,846 - INFO - Processing document 4_2023-09-22
2025-11-14 17:25:11,868 - INFO - Finished converting document 4_2023-09-22 in 0.03 sec.


Converted 'data\edgar_documents\ORCL\4_2023-08-07' --> 'data\processed_data\ORCL\4_2023-08-07.md'
Converted 'data\edgar_documents\ORCL\4_2023-09-06' --> 'data\processed_data\ORCL\4_2023-09-06.md'
Converted 'data\edgar_documents\ORCL\4_2023-09-18' --> 'data\processed_data\ORCL\4_2023-09-18.md'
Converted 'data\edgar_documents\ORCL\4_2023-09-22' --> 'data\processed_data\ORCL\4_2023-09-22.md'


2025-11-14 17:25:11,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:11,927 - INFO - Going to convert document batch...
2025-11-14 17:25:11,928 - INFO - Processing document 4_2023-10-06
2025-11-14 17:25:11,948 - INFO - Finished converting document 4_2023-10-06 in 0.06 sec.
2025-11-14 17:25:12,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,030 - INFO - Going to convert document batch...
2025-11-14 17:25:12,030 - INFO - Processing document 4_2023-10-30
2025-11-14 17:25:12,051 - INFO - Finished converting document 4_2023-10-30 in 0.06 sec.
2025-11-14 17:25:12,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,090 - INFO - Going to convert document batch...
2025-11-14 17:25:12,091 - INFO - Processing document 4_2023-11-13
2025-11-14 17:25:12,111 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 17:25:12,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\ORCL\4_2023-10-06' --> 'data\processed_data\ORCL\4_2023-10-06.md'
Converted 'data\edgar_documents\ORCL\4_2023-10-30' --> 'data\processed_data\ORCL\4_2023-10-30.md'
Converted 'data\edgar_documents\ORCL\4_2023-11-13' --> 'data\processed_data\ORCL\4_2023-11-13.md'


2025-11-14 17:25:12,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,211 - INFO - Going to convert document batch...
2025-11-14 17:25:12,212 - INFO - Processing document 4_2023-12-21
2025-11-14 17:25:12,231 - INFO - Finished converting document 4_2023-12-21 in 0.05 sec.
2025-11-14 17:25:12,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,289 - INFO - Going to convert document batch...
2025-11-14 17:25:12,290 - INFO - Processing document 4_2023-12-22
2025-11-14 17:25:12,333 - INFO - Finished converting document 4_2023-12-22 in 0.08 sec.
2025-11-14 17:25:12,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,375 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ORCL\4_2023-12-05' --> 'data\processed_data\ORCL\4_2023-12-05.md'
Converted 'data\edgar_documents\ORCL\4_2023-12-21' --> 'data\processed_data\ORCL\4_2023-12-21.md'
Converted 'data\edgar_documents\ORCL\4_2023-12-22' --> 'data\processed_data\ORCL\4_2023-12-22.md'


2025-11-14 17:25:12,376 - INFO - Processing document 4_2024-01-26
2025-11-14 17:25:12,394 - INFO - Finished converting document 4_2024-01-26 in 0.03 sec.
2025-11-14 17:25:12,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,446 - INFO - Going to convert document batch...
2025-11-14 17:25:12,448 - INFO - Processing document 4_2024-03-14
2025-11-14 17:25:12,477 - INFO - Finished converting document 4_2024-03-14 in 0.05 sec.
2025-11-14 17:25:12,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,545 - INFO - Going to convert document batch...
2025-11-14 17:25:12,546 - INFO - Processing document 4_2024-03-19
2025-11-14 17:25:12,569 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 17:25:12,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\4_2024-01-26' --> 'data\processed_data\ORCL\4_2024-01-26.md'
Converted 'data\edgar_documents\ORCL\4_2024-03-14' --> 'data\processed_data\ORCL\4_2024-03-14.md'
Converted 'data\edgar_documents\ORCL\4_2024-03-19' --> 'data\processed_data\ORCL\4_2024-03-19.md'


2025-11-14 17:25:12,625 - INFO - Going to convert document batch...
2025-11-14 17:25:12,626 - INFO - Processing document 4_2024-03-27
2025-11-14 17:25:12,669 - INFO - Finished converting document 4_2024-03-27 in 0.08 sec.
2025-11-14 17:25:12,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,753 - INFO - Going to convert document batch...
2025-11-14 17:25:12,753 - INFO - Processing document 4_2024-04-26
2025-11-14 17:25:12,775 - INFO - Finished converting document 4_2024-04-26 in 0.05 sec.
2025-11-14 17:25:12,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,840 - INFO - Going to convert document batch...
2025-11-14 17:25:12,841 - INFO - Processing document 4_2024-05-02
2025-11-14 17:25:12,865 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 17:25:12,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,906 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ORCL\4_2024-03-27' --> 'data\processed_data\ORCL\4_2024-03-27.md'
Converted 'data\edgar_documents\ORCL\4_2024-04-26' --> 'data\processed_data\ORCL\4_2024-04-26.md'
Converted 'data\edgar_documents\ORCL\4_2024-05-02' --> 'data\processed_data\ORCL\4_2024-05-02.md'


2025-11-14 17:25:12,907 - INFO - Processing document 4_2024-05-06
2025-11-14 17:25:12,928 - INFO - Finished converting document 4_2024-05-06 in 0.03 sec.
2025-11-14 17:25:12,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:12,984 - INFO - Going to convert document batch...
2025-11-14 17:25:12,985 - INFO - Processing document 4_2024-05-08
2025-11-14 17:25:13,025 - INFO - Finished converting document 4_2024-05-08 in 0.06 sec.
2025-11-14 17:25:13,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,091 - INFO - Going to convert document batch...
2025-11-14 17:25:13,092 - INFO - Processing document 4_2024-06-03
2025-11-14 17:25:13,113 - INFO - Finished converting document 4_2024-06-03 in 0.06 sec.
2025-11-14 17:25:13,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\4_2024-05-06' --> 'data\processed_data\ORCL\4_2024-05-06.md'
Converted 'data\edgar_documents\ORCL\4_2024-05-08' --> 'data\processed_data\ORCL\4_2024-05-08.md'
Converted 'data\edgar_documents\ORCL\4_2024-06-03' --> 'data\processed_data\ORCL\4_2024-06-03.md'


2025-11-14 17:25:13,164 - INFO - Going to convert document batch...
2025-11-14 17:25:13,165 - INFO - Processing document 4_2024-06-21
2025-11-14 17:25:13,187 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.
2025-11-14 17:25:13,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,235 - INFO - Going to convert document batch...
2025-11-14 17:25:13,236 - INFO - Processing document 4_2024-06-24
2025-11-14 17:25:13,262 - INFO - Finished converting document 4_2024-06-24 in 0.06 sec.
2025-11-14 17:25:13,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,307 - INFO - Going to convert document batch...
2025-11-14 17:25:13,308 - INFO - Processing document 4_2024-06-27
2025-11-14 17:25:13,329 - INFO - Finished converting document 4_2024-06-27 in 0.05 sec.
2025-11-14 17:25:13,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,370 - INFO - Going to convert document batch...
2025-11-14 17:25:13,371 - 

Converted 'data\edgar_documents\ORCL\4_2024-06-21' --> 'data\processed_data\ORCL\4_2024-06-21.md'
Converted 'data\edgar_documents\ORCL\4_2024-06-24' --> 'data\processed_data\ORCL\4_2024-06-24.md'
Converted 'data\edgar_documents\ORCL\4_2024-06-27' --> 'data\processed_data\ORCL\4_2024-06-27.md'


2025-11-14 17:25:13,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,429 - INFO - Going to convert document batch...
2025-11-14 17:25:13,430 - INFO - Processing document 4_2024-07-11
2025-11-14 17:25:13,456 - INFO - Finished converting document 4_2024-07-11 in 0.05 sec.
2025-11-14 17:25:13,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,504 - INFO - Going to convert document batch...
2025-11-14 17:25:13,505 - INFO - Processing document 4_2024-07-17
2025-11-14 17:25:13,544 - INFO - Finished converting document 4_2024-07-17 in 0.08 sec.


Converted 'data\edgar_documents\ORCL\4_2024-06-28' --> 'data\processed_data\ORCL\4_2024-06-28.md'
Converted 'data\edgar_documents\ORCL\4_2024-07-11' --> 'data\processed_data\ORCL\4_2024-07-11.md'


2025-11-14 17:25:13,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,617 - INFO - Going to convert document batch...
2025-11-14 17:25:13,618 - INFO - Processing document 4_2024-07-19
2025-11-14 17:25:13,640 - INFO - Finished converting document 4_2024-07-19 in 0.05 sec.
2025-11-14 17:25:13,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,701 - INFO - Going to convert document batch...
2025-11-14 17:25:13,702 - INFO - Processing document 4_2024-07-26
2025-11-14 17:25:13,724 - INFO - Finished converting document 4_2024-07-26 in 0.05 sec.
2025-11-14 17:25:13,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,774 - INFO - Going to convert document batch...
2025-11-14 17:25:13,775 - INFO - Processing document 4_2024-08-07
2025-11-14 17:25:13,803 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.


Converted 'data\edgar_documents\ORCL\4_2024-07-17' --> 'data\processed_data\ORCL\4_2024-07-17.md'
Converted 'data\edgar_documents\ORCL\4_2024-07-19' --> 'data\processed_data\ORCL\4_2024-07-19.md'
Converted 'data\edgar_documents\ORCL\4_2024-07-26' --> 'data\processed_data\ORCL\4_2024-07-26.md'


2025-11-14 17:25:13,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,852 - INFO - Going to convert document batch...
2025-11-14 17:25:13,853 - INFO - Processing document 4_2024-09-06
2025-11-14 17:25:13,879 - INFO - Finished converting document 4_2024-09-06 in 0.05 sec.
2025-11-14 17:25:13,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:13,937 - INFO - Going to convert document batch...
2025-11-14 17:25:13,938 - INFO - Processing document 4_2024-09-17
2025-11-14 17:25:13,963 - INFO - Finished converting document 4_2024-09-17 in 0.05 sec.
2025-11-14 17:25:13,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,007 - INFO - Going to convert document batch...
2025-11-14 17:25:14,007 - INFO - Processing document 4_2024-09-23


Converted 'data\edgar_documents\ORCL\4_2024-08-07' --> 'data\processed_data\ORCL\4_2024-08-07.md'
Converted 'data\edgar_documents\ORCL\4_2024-09-06' --> 'data\processed_data\ORCL\4_2024-09-06.md'
Converted 'data\edgar_documents\ORCL\4_2024-09-17' --> 'data\processed_data\ORCL\4_2024-09-17.md'


2025-11-14 17:25:14,032 - INFO - Finished converting document 4_2024-09-23 in 0.05 sec.
2025-11-14 17:25:14,076 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:14,076 - ERROR - Input document 4_2024-09-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:14,078 - INFO - Going to convert document batch...
2025-11-14 17:25:14,101 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:14,101 - ERROR - Input document 4_2024-09-26 with forma

Converted 'data\edgar_documents\ORCL\4_2024-09-23' --> 'data\processed_data\ORCL\4_2024-09-23.md'
Error processing data\edgar_documents\ORCL\4_2024-09-25: File format not allowed: data\edgar_documents\ORCL\4_2024-09-25
Error processing data\edgar_documents\ORCL\4_2024-09-26: File format not allowed: data\edgar_documents\ORCL\4_2024-09-26
Converted 'data\edgar_documents\ORCL\4_2024-10-08' --> 'data\processed_data\ORCL\4_2024-10-08.md'
Converted 'data\edgar_documents\ORCL\4_2024-10-28' --> 'data\processed_data\ORCL\4_2024-10-28.md'


2025-11-14 17:25:14,245 - INFO - Going to convert document batch...
2025-11-14 17:25:14,246 - INFO - Processing document 4_2024-10-29
2025-11-14 17:25:14,265 - INFO - Finished converting document 4_2024-10-29 in 0.05 sec.
2025-11-14 17:25:14,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,309 - INFO - Going to convert document batch...
2025-11-14 17:25:14,310 - INFO - Processing document 4_2024-11-12
2025-11-14 17:25:14,328 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:25:14,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,399 - INFO - Going to convert document batch...
2025-11-14 17:25:14,401 - INFO - Processing document 4_2024-12-09
2025-11-14 17:25:14,424 - INFO - Finished converting document 4_2024-12-09 in 0.06 sec.
2025-11-14 17:25:14,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,477 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ORCL\4_2024-10-29' --> 'data\processed_data\ORCL\4_2024-10-29.md'
Converted 'data\edgar_documents\ORCL\4_2024-11-12' --> 'data\processed_data\ORCL\4_2024-11-12.md'
Converted 'data\edgar_documents\ORCL\4_2024-12-09' --> 'data\processed_data\ORCL\4_2024-12-09.md'


2025-11-14 17:25:14,477 - INFO - Processing document 4_2025-01-24
2025-11-14 17:25:14,523 - INFO - Finished converting document 4_2025-01-24 in 0.08 sec.
2025-11-14 17:25:14,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,580 - INFO - Going to convert document batch...
2025-11-14 17:25:14,580 - INFO - Processing document 4_2025-01-27
2025-11-14 17:25:14,603 - INFO - Finished converting document 4_2025-01-27 in 0.03 sec.
2025-11-14 17:25:14,644 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:14,645 - ERROR - Input document 4_2025-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\ORCL\4_2025-01-24' --> 'data\processed_data\ORCL\4_2025-01-24.md'
Converted 'data\edgar_documents\ORCL\4_2025-01-27' --> 'data\processed_data\ORCL\4_2025-01-27.md'
Error processing data\edgar_documents\ORCL\4_2025-01-30: File format not allowed: data\edgar_documents\ORCL\4_2025-01-30
Error processing data\edgar_documents\ORCL\4_2025-01-31: File format not allowed: data\edgar_documents\ORCL\4_2025-01-31
Converted 'data\edgar_documents\ORCL\4_2025-02-14' --> 'data\processed_data\ORCL\4_2025-02-14.md'


2025-11-14 17:25:14,750 - INFO - Processing document 4_2025-03-21
2025-11-14 17:25:14,773 - INFO - Finished converting document 4_2025-03-21 in 0.05 sec.
2025-11-14 17:25:14,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,817 - INFO - Going to convert document batch...
2025-11-14 17:25:14,818 - INFO - Processing document 4_2025-04-04
2025-11-14 17:25:14,850 - INFO - Finished converting document 4_2025-04-04 in 0.05 sec.
2025-11-14 17:25:14,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,917 - INFO - Going to convert document batch...
2025-11-14 17:25:14,918 - INFO - Processing document 4_2025-04-15
2025-11-14 17:25:14,938 - INFO - Finished converting document 4_2025-04-15 in 0.06 sec.
2025-11-14 17:25:14,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:14,981 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ORCL\4_2025-03-21' --> 'data\processed_data\ORCL\4_2025-03-21.md'
Converted 'data\edgar_documents\ORCL\4_2025-04-04' --> 'data\processed_data\ORCL\4_2025-04-04.md'
Converted 'data\edgar_documents\ORCL\4_2025-04-15' --> 'data\processed_data\ORCL\4_2025-04-15.md'


2025-11-14 17:25:14,981 - INFO - Processing document 4_2025-04-18
2025-11-14 17:25:15,002 - INFO - Finished converting document 4_2025-04-18 in 0.05 sec.
2025-11-14 17:25:15,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,043 - INFO - Going to convert document batch...
2025-11-14 17:25:15,044 - INFO - Processing document 4_2025-04-23
2025-11-14 17:25:15,062 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 17:25:15,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,102 - INFO - Going to convert document batch...
2025-11-14 17:25:15,103 - INFO - Processing document 4_2025-04-25


Converted 'data\edgar_documents\ORCL\4_2025-04-18' --> 'data\processed_data\ORCL\4_2025-04-18.md'
Converted 'data\edgar_documents\ORCL\4_2025-04-23' --> 'data\processed_data\ORCL\4_2025-04-23.md'


2025-11-14 17:25:15,337 - INFO - Finished converting document 4_2025-04-25 in 0.25 sec.
2025-11-14 17:25:15,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,378 - INFO - Going to convert document batch...
2025-11-14 17:25:15,379 - INFO - Processing document 4_2025-05-06
2025-11-14 17:25:15,406 - INFO - Finished converting document 4_2025-05-06 in 0.05 sec.
2025-11-14 17:25:15,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,446 - INFO - Going to convert document batch...
2025-11-14 17:25:15,447 - INFO - Processing document 4_2025-05-16
2025-11-14 17:25:15,466 - INFO - Finished converting document 4_2025-05-16 in 0.05 sec.
2025-11-14 17:25:15,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,506 - INFO - Going to convert document batch...
2025-11-14 17:25:15,507 - INFO - Processing document 4_2025-06-03
2025-11-14 17:25:15,529 - INFO - Finished converting document 4_2025-06-03 in 0.05 sec.


Converted 'data\edgar_documents\ORCL\4_2025-04-25' --> 'data\processed_data\ORCL\4_2025-04-25.md'
Converted 'data\edgar_documents\ORCL\4_2025-05-06' --> 'data\processed_data\ORCL\4_2025-05-06.md'
Converted 'data\edgar_documents\ORCL\4_2025-05-16' --> 'data\processed_data\ORCL\4_2025-05-16.md'


2025-11-14 17:25:15,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,574 - INFO - Going to convert document batch...
2025-11-14 17:25:15,575 - INFO - Processing document 4_2025-06-13
2025-11-14 17:25:15,612 - INFO - Finished converting document 4_2025-06-13 in 0.06 sec.
2025-11-14 17:25:15,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,669 - INFO - Going to convert document batch...
2025-11-14 17:25:15,670 - INFO - Processing document 4_2025-06-20
2025-11-14 17:25:15,688 - INFO - Finished converting document 4_2025-06-20 in 0.03 sec.
2025-11-14 17:25:15,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,741 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ORCL\4_2025-06-03' --> 'data\processed_data\ORCL\4_2025-06-03.md'
Converted 'data\edgar_documents\ORCL\4_2025-06-13' --> 'data\processed_data\ORCL\4_2025-06-13.md'
Converted 'data\edgar_documents\ORCL\4_2025-06-20' --> 'data\processed_data\ORCL\4_2025-06-20.md'


2025-11-14 17:25:15,741 - INFO - Processing document 4_2025-06-24
2025-11-14 17:25:15,793 - INFO - Finished converting document 4_2025-06-24 in 0.09 sec.
2025-11-14 17:25:15,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,880 - INFO - Going to convert document batch...
2025-11-14 17:25:15,881 - INFO - Processing document 4_2025-06-25
2025-11-14 17:25:15,902 - INFO - Finished converting document 4_2025-06-25 in 0.06 sec.
2025-11-14 17:25:15,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:15,953 - INFO - Going to convert document batch...
2025-11-14 17:25:15,954 - INFO - Processing document 4_2025-06-26
2025-11-14 17:25:15,995 - INFO - Finished converting document 4_2025-06-26 in 0.08 sec.


Converted 'data\edgar_documents\ORCL\4_2025-06-24' --> 'data\processed_data\ORCL\4_2025-06-24.md'
Converted 'data\edgar_documents\ORCL\4_2025-06-25' --> 'data\processed_data\ORCL\4_2025-06-25.md'


2025-11-14 17:25:16,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,053 - INFO - Going to convert document batch...
2025-11-14 17:25:16,054 - INFO - Processing document 4_2025-07-01
2025-11-14 17:25:16,086 - INFO - Finished converting document 4_2025-07-01 in 0.05 sec.
2025-11-14 17:25:16,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,133 - INFO - Going to convert document batch...
2025-11-14 17:25:16,134 - INFO - Processing document 4_2025-07-08
2025-11-14 17:25:16,152 - INFO - Finished converting document 4_2025-07-08 in 0.05 sec.
2025-11-14 17:25:16,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,192 - INFO - Going to convert document batch...
2025-11-14 17:25:16,193 - INFO - Processing document 4_2025-07-09
2025-11-14 17:25:16,213 - INFO - Finished converting document 4_2025-07-09 in 0.05 sec.


Converted 'data\edgar_documents\ORCL\4_2025-06-26' --> 'data\processed_data\ORCL\4_2025-06-26.md'
Converted 'data\edgar_documents\ORCL\4_2025-07-01' --> 'data\processed_data\ORCL\4_2025-07-01.md'
Converted 'data\edgar_documents\ORCL\4_2025-07-08' --> 'data\processed_data\ORCL\4_2025-07-08.md'


2025-11-14 17:25:16,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,259 - INFO - Going to convert document batch...
2025-11-14 17:25:16,260 - INFO - Processing document 4_2025-07-11
2025-11-14 17:25:16,287 - INFO - Finished converting document 4_2025-07-11 in 0.05 sec.
2025-11-14 17:25:16,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,346 - INFO - Going to convert document batch...
2025-11-14 17:25:16,347 - INFO - Processing document 4_2025-07-17
2025-11-14 17:25:16,369 - INFO - Finished converting document 4_2025-07-17 in 0.06 sec.
2025-11-14 17:25:16,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,416 - INFO - Going to convert document batch...
2025-11-14 17:25:16,417 - INFO - Processing document 4_2025-07-18


Converted 'data\edgar_documents\ORCL\4_2025-07-09' --> 'data\processed_data\ORCL\4_2025-07-09.md'
Converted 'data\edgar_documents\ORCL\4_2025-07-11' --> 'data\processed_data\ORCL\4_2025-07-11.md'
Converted 'data\edgar_documents\ORCL\4_2025-07-17' --> 'data\processed_data\ORCL\4_2025-07-17.md'


2025-11-14 17:25:16,436 - INFO - Finished converting document 4_2025-07-18 in 0.05 sec.
2025-11-14 17:25:16,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,489 - INFO - Going to convert document batch...
2025-11-14 17:25:16,490 - INFO - Processing document 4_2025-07-28
2025-11-14 17:25:16,518 - INFO - Finished converting document 4_2025-07-28 in 0.06 sec.
2025-11-14 17:25:16,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,588 - INFO - Going to convert document batch...
2025-11-14 17:25:16,588 - INFO - Processing document 4_2025-08-06
2025-11-14 17:25:16,608 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 17:25:16,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\4_2025-07-18' --> 'data\processed_data\ORCL\4_2025-07-18.md'
Converted 'data\edgar_documents\ORCL\4_2025-07-28' --> 'data\processed_data\ORCL\4_2025-07-28.md'
Converted 'data\edgar_documents\ORCL\4_2025-08-06' --> 'data\processed_data\ORCL\4_2025-08-06.md'


2025-11-14 17:25:16,654 - INFO - Going to convert document batch...
2025-11-14 17:25:16,655 - INFO - Processing document 4_2025-08-07
2025-11-14 17:25:16,691 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.
2025-11-14 17:25:16,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,743 - INFO - Going to convert document batch...
2025-11-14 17:25:16,744 - INFO - Processing document 4_2025-09-16
2025-11-14 17:25:16,765 - INFO - Finished converting document 4_2025-09-16 in 0.05 sec.
2025-11-14 17:25:16,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,827 - INFO - Going to convert document batch...
2025-11-14 17:25:16,829 - INFO - Processing document 4_2025-09-17
2025-11-14 17:25:16,850 - INFO - Finished converting document 4_2025-09-17 in 0.05 sec.
2025-11-14 17:25:16,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:16,894 - INFO - Going to convert document batch...
2025-11-14 17:25:16,896 - 

Converted 'data\edgar_documents\ORCL\4_2025-08-07' --> 'data\processed_data\ORCL\4_2025-08-07.md'
Converted 'data\edgar_documents\ORCL\4_2025-09-16' --> 'data\processed_data\ORCL\4_2025-09-16.md'
Converted 'data\edgar_documents\ORCL\4_2025-09-17' --> 'data\processed_data\ORCL\4_2025-09-17.md'


2025-11-14 17:25:16,924 - INFO - Finished converting document 4_2025-09-23 in 0.05 sec.
2025-11-14 17:25:16,972 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:16,972 - ERROR - Input document 4_2025-09-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:16,974 - INFO - Going to convert document batch...
2025-11-14 17:25:16,994 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:16,995 - ERROR - Input document 4_2025-09-25 with forma

Converted 'data\edgar_documents\ORCL\4_2025-09-23' --> 'data\processed_data\ORCL\4_2025-09-23.md'
Error processing data\edgar_documents\ORCL\4_2025-09-24: File format not allowed: data\edgar_documents\ORCL\4_2025-09-24
Error processing data\edgar_documents\ORCL\4_2025-09-25: File format not allowed: data\edgar_documents\ORCL\4_2025-09-25
Converted 'data\edgar_documents\ORCL\4_2025-09-26' --> 'data\processed_data\ORCL\4_2025-09-26.md'
Converted 'data\edgar_documents\ORCL\4_2025-09-30' --> 'data\processed_data\ORCL\4_2025-09-30.md'


2025-11-14 17:25:17,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,159 - INFO - Going to convert document batch...
2025-11-14 17:25:17,159 - INFO - Processing document 4_2025-10-14
2025-11-14 17:25:17,177 - INFO - Finished converting document 4_2025-10-14 in 0.05 sec.
2025-11-14 17:25:17,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,220 - INFO - Going to convert document batch...
2025-11-14 17:25:17,221 - INFO - Processing document 4_2025-10-23
2025-11-14 17:25:17,239 - INFO - Finished converting document 4_2025-10-23 in 0.03 sec.
2025-11-14 17:25:17,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,291 - INFO - Going to convert document batch...
2025-11-14 17:25:17,292 - INFO - Processing document 4_2025-10-27
2025-11-14 17:25:17,310 - INFO - Finished converting document 4_2025-10-27 in 0.06 sec.
2025-11-14 17:25:17,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\ORCL\4_2025-10-14' --> 'data\processed_data\ORCL\4_2025-10-14.md'
Converted 'data\edgar_documents\ORCL\4_2025-10-23' --> 'data\processed_data\ORCL\4_2025-10-23.md'
Converted 'data\edgar_documents\ORCL\4_2025-10-27' --> 'data\processed_data\ORCL\4_2025-10-27.md'


2025-11-14 17:25:17,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,423 - INFO - Going to convert document batch...
2025-11-14 17:25:17,424 - INFO - Processing document 8-K_2023-02-06
2025-11-14 17:25:17,442 - INFO - Finished converting document 8-K_2023-02-06 in 0.05 sec.
2025-11-14 17:25:17,493 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:17,494 - ERROR - Input document 8-K_2023-03-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\ORCL\4_2025-10-30' --> 'data\processed_data\ORCL\4_2025-10-30.md'
Converted 'data\edgar_documents\ORCL\8-K_2023-02-06' --> 'data\processed_data\ORCL\8-K_2023-02-06.md'
Error processing data\edgar_documents\ORCL\8-K_2023-03-09: File format not allowed: data\edgar_documents\ORCL\8-K_2023-03-09
Converted 'data\edgar_documents\ORCL\8-K_2023-06-12' --> 'data\processed_data\ORCL\8-K_2023-06-12.md'


2025-11-14 17:25:17,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,597 - INFO - Going to convert document batch...
2025-11-14 17:25:17,598 - INFO - Processing document 8-K_2023-09-11
2025-11-14 17:25:17,612 - INFO - Finished converting document 8-K_2023-09-11 in 0.06 sec.
2025-11-14 17:25:17,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,655 - INFO - Going to convert document batch...
2025-11-14 17:25:17,657 - INFO - Processing document 8-K_2023-11-17
2025-11-14 17:25:17,685 - INFO - Finished converting document 8-K_2023-11-17 in 0.06 sec.
2025-11-14 17:25:17,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,748 - INFO - Going to convert document batch...
2025-11-14 17:25:17,750 - INFO - Processing document 8-K_2023-12-11
2025-11-14 17:25:17,764 - INFO - Finished converting document 8-K_2023-12-11 in 0.06 sec.
2025-11-14 17:25:17,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ORCL\8-K_2023-09-11' --> 'data\processed_data\ORCL\8-K_2023-09-11.md'
Converted 'data\edgar_documents\ORCL\8-K_2023-11-17' --> 'data\processed_data\ORCL\8-K_2023-11-17.md'
Converted 'data\edgar_documents\ORCL\8-K_2023-12-11' --> 'data\processed_data\ORCL\8-K_2023-12-11.md'


2025-11-14 17:25:17,832 - INFO - Going to convert document batch...
2025-11-14 17:25:17,834 - INFO - Processing document 8-K_2024-03-11
2025-11-14 17:25:17,850 - INFO - Finished converting document 8-K_2024-03-11 in 0.08 sec.
2025-11-14 17:25:17,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,893 - INFO - Going to convert document batch...
2025-11-14 17:25:17,894 - INFO - Processing document 8-K_2024-06-11
2025-11-14 17:25:17,925 - INFO - Finished converting document 8-K_2024-06-11 in 0.06 sec.
2025-11-14 17:25:17,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:17,967 - INFO - Going to convert document batch...
2025-11-14 17:25:17,967 - INFO - Processing document 8-K_2024-09-09
2025-11-14 17:25:17,983 - INFO - Finished converting document 8-K_2024-09-09 in 0.05 sec.
2025-11-14 17:25:18,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,014 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\ORCL\8-K_2024-03-11' --> 'data\processed_data\ORCL\8-K_2024-03-11.md'
Converted 'data\edgar_documents\ORCL\8-K_2024-06-11' --> 'data\processed_data\ORCL\8-K_2024-06-11.md'
Converted 'data\edgar_documents\ORCL\8-K_2024-09-09' --> 'data\processed_data\ORCL\8-K_2024-09-09.md'


2025-11-14 17:25:18,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,070 - INFO - Going to convert document batch...
2025-11-14 17:25:18,071 - INFO - Processing document 8-K_2024-11-18
2025-11-14 17:25:18,096 - INFO - Finished converting document 8-K_2024-11-18 in 0.05 sec.
2025-11-14 17:25:18,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,157 - INFO - Going to convert document batch...
2025-11-14 17:25:18,158 - INFO - Processing document 8-K_2024-12-09
2025-11-14 17:25:18,173 - INFO - Finished converting document 8-K_2024-12-09 in 0.06 sec.
2025-11-14 17:25:18,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,204 - INFO - Going to convert document batch...
2025-11-14 17:25:18,205 - INFO - Processing document 8-K_2025-01-13
2025-11-14 17:25:18,218 - INFO - Finished converting document 8-K_2025-01-13 in 0.03 sec.


Converted 'data\edgar_documents\ORCL\8-K_2024-09-27' --> 'data\processed_data\ORCL\8-K_2024-09-27.md'
Converted 'data\edgar_documents\ORCL\8-K_2024-11-18' --> 'data\processed_data\ORCL\8-K_2024-11-18.md'
Converted 'data\edgar_documents\ORCL\8-K_2024-12-09' --> 'data\processed_data\ORCL\8-K_2024-12-09.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-01-13' --> 'data\processed_data\ORCL\8-K_2025-01-13.md'


2025-11-14 17:25:18,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,268 - INFO - Going to convert document batch...
2025-11-14 17:25:18,269 - INFO - Processing document 8-K_2025-01-22
2025-11-14 17:25:18,282 - INFO - Finished converting document 8-K_2025-01-22 in 0.06 sec.
2025-11-14 17:25:18,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,334 - INFO - Going to convert document batch...
2025-11-14 17:25:18,335 - INFO - Processing document 8-K_2025-02-03
2025-11-14 17:25:18,370 - INFO - Finished converting document 8-K_2025-02-03 in 0.08 sec.
2025-11-14 17:25:18,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,409 - INFO - Going to convert document batch...
2025-11-14 17:25:18,410 - INFO - Processing document 8-K_2025-02-26
2025-11-14 17:25:18,424 - INFO - Finished converting document 8-K_2025-02-26 in 0.05 sec.
2025-11-14 17:25:18,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ORCL\8-K_2025-01-22' --> 'data\processed_data\ORCL\8-K_2025-01-22.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-02-03' --> 'data\processed_data\ORCL\8-K_2025-02-03.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-02-26' --> 'data\processed_data\ORCL\8-K_2025-02-26.md'


2025-11-14 17:25:18,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,509 - INFO - Going to convert document batch...
2025-11-14 17:25:18,510 - INFO - Processing document 8-K_2025-06-11
2025-11-14 17:25:18,526 - INFO - Finished converting document 8-K_2025-06-11 in 0.05 sec.
2025-11-14 17:25:18,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,559 - INFO - Going to convert document batch...
2025-11-14 17:25:18,561 - INFO - Processing document 8-K_2025-06-30
2025-11-14 17:25:18,576 - INFO - Finished converting document 8-K_2025-06-30 in 0.05 sec.
2025-11-14 17:25:18,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,607 - INFO - Going to convert document batch...
2025-11-14 17:25:18,608 - INFO - Processing document 8-K_2025-09-09
2025-11-14 17:25:18,623 - INFO - Finished converting document 8-K_2025-09-09 in 0.05 sec.
2025-11-14 17:25:18,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ORCL\8-K_2025-03-10' --> 'data\processed_data\ORCL\8-K_2025-03-10.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-06-11' --> 'data\processed_data\ORCL\8-K_2025-06-11.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-06-30' --> 'data\processed_data\ORCL\8-K_2025-06-30.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-09-09' --> 'data\processed_data\ORCL\8-K_2025-09-09.md'


2025-11-14 17:25:18,674 - INFO - Processing document 8-K_2025-09-22
2025-11-14 17:25:18,689 - INFO - Finished converting document 8-K_2025-09-22 in 0.06 sec.
2025-11-14 17:25:18,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,727 - INFO - Going to convert document batch...
2025-11-14 17:25:18,728 - INFO - Processing document 8-K_2025-09-26
2025-11-14 17:25:18,746 - INFO - Finished converting document 8-K_2025-09-26 in 0.05 sec.
2025-11-14 17:25:18,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:18,802 - INFO - Going to convert document batch...
2025-11-14 17:25:18,804 - INFO - Processing document 8-K_2025-10-06
2025-11-14 17:25:18,818 - INFO - Finished converting document 8-K_2025-10-06 in 0.05 sec.
2025-11-14 17:25:18,857 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:18,858 - ERROR - Input document DEF-14A_2023-09-22 with format None does not match any 

Converted 'data\edgar_documents\ORCL\8-K_2025-09-22' --> 'data\processed_data\ORCL\8-K_2025-09-22.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-09-26' --> 'data\processed_data\ORCL\8-K_2025-09-26.md'
Converted 'data\edgar_documents\ORCL\8-K_2025-10-06' --> 'data\processed_data\ORCL\8-K_2025-10-06.md'
Error processing data\edgar_documents\ORCL\DEF-14A_2023-09-22: File format not allowed: data\edgar_documents\ORCL\DEF-14A_2023-09-22


2025-11-14 17:25:18,894 - ERROR - Input document DEF-14A_2024-09-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:18,896 - INFO - Going to convert document batch...
2025-11-14 17:25:18,928 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:18,929 - ERROR - Input document DEF-14A_2025-09-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\ORCL\DEF-14A_2024-09-25: File format not allowed: data\edgar_documents\ORCL\DEF-14A_2024-09-25
Error processing data\edgar_documents\ORCL\DEF-14A_2025-09-26: File format not allowed: data\edgar_documents\ORCL\DEF-14A_2025-09-26
Processed 119 new files. Errors: 13
Found 82 files to process in data\edgar_documents\PEP


2025-11-14 17:25:20,339 - INFO - Going to convert document batch...
2025-11-14 17:25:20,340 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:25:20,340 - INFO - Processing document 10-K_2023-02-09
2025-11-14 17:25:22,537 - INFO - Finished converting document 10-K_2023-02-09 in 3.59 sec.
2025-11-14 17:25:23,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-K_2023-02-09' --> 'data\processed_data\PEP\10-K_2023-02-09.md'


2025-11-14 17:25:24,390 - INFO - Going to convert document batch...
2025-11-14 17:25:24,391 - INFO - Processing document 10-K_2024-02-09
2025-11-14 17:25:26,708 - INFO - Finished converting document 10-K_2024-02-09 in 3.45 sec.
2025-11-14 17:25:27,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-K_2024-02-09' --> 'data\processed_data\PEP\10-K_2024-02-09.md'


2025-11-14 17:25:28,780 - INFO - Going to convert document batch...
2025-11-14 17:25:28,780 - INFO - Processing document 10-K_2025-02-04
2025-11-14 17:25:31,071 - INFO - Finished converting document 10-K_2025-02-04 in 3.61 sec.
2025-11-14 17:25:31,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-K_2025-02-04' --> 'data\processed_data\PEP\10-K_2025-02-04.md'


2025-11-14 17:25:32,710 - INFO - Going to convert document batch...
2025-11-14 17:25:32,711 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 17:25:33,479 - INFO - Finished converting document 10-Q_2023-04-25 in 1.66 sec.
2025-11-14 17:25:33,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2023-04-25' --> 'data\processed_data\PEP\10-Q_2023-04-25.md'


2025-11-14 17:25:34,445 - INFO - Going to convert document batch...
2025-11-14 17:25:34,446 - INFO - Processing document 10-Q_2023-07-13
2025-11-14 17:25:35,551 - INFO - Finished converting document 10-Q_2023-07-13 in 1.67 sec.
2025-11-14 17:25:36,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2023-07-13' --> 'data\processed_data\PEP\10-Q_2023-07-13.md'


2025-11-14 17:25:37,177 - INFO - Going to convert document batch...
2025-11-14 17:25:37,178 - INFO - Processing document 10-Q_2023-10-10
2025-11-14 17:25:38,362 - INFO - Finished converting document 10-Q_2023-10-10 in 2.25 sec.
2025-11-14 17:25:38,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2023-10-10' --> 'data\processed_data\PEP\10-Q_2023-10-10.md'


2025-11-14 17:25:39,695 - INFO - Going to convert document batch...
2025-11-14 17:25:39,696 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 17:25:40,476 - INFO - Finished converting document 10-Q_2024-04-23 in 1.52 sec.
2025-11-14 17:25:40,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2024-04-23' --> 'data\processed_data\PEP\10-Q_2024-04-23.md'


2025-11-14 17:25:41,431 - INFO - Going to convert document batch...
2025-11-14 17:25:41,432 - INFO - Processing document 10-Q_2024-07-11
2025-11-14 17:25:42,887 - INFO - Finished converting document 10-Q_2024-07-11 in 2.00 sec.
2025-11-14 17:25:43,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2024-07-11' --> 'data\processed_data\PEP\10-Q_2024-07-11.md'


2025-11-14 17:25:44,003 - INFO - Going to convert document batch...
2025-11-14 17:25:44,004 - INFO - Processing document 10-Q_2024-10-08
2025-11-14 17:25:45,074 - INFO - Finished converting document 10-Q_2024-10-08 in 1.70 sec.
2025-11-14 17:25:45,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2024-10-08' --> 'data\processed_data\PEP\10-Q_2024-10-08.md'


2025-11-14 17:25:46,366 - INFO - Going to convert document batch...
2025-11-14 17:25:46,367 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:25:47,080 - INFO - Finished converting document 10-Q_2025-04-24 in 1.47 sec.
2025-11-14 17:25:47,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2025-04-24' --> 'data\processed_data\PEP\10-Q_2025-04-24.md'


2025-11-14 17:25:48,009 - INFO - Going to convert document batch...
2025-11-14 17:25:48,009 - INFO - Processing document 10-Q_2025-07-17
2025-11-14 17:25:49,563 - INFO - Finished converting document 10-Q_2025-07-17 in 2.14 sec.
2025-11-14 17:25:50,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\10-Q_2025-07-17' --> 'data\processed_data\PEP\10-Q_2025-07-17.md'


2025-11-14 17:25:50,795 - INFO - Going to convert document batch...
2025-11-14 17:25:50,796 - INFO - Processing document 10-Q_2025-10-09
2025-11-14 17:25:52,398 - INFO - Finished converting document 10-Q_2025-10-09 in 2.28 sec.
2025-11-14 17:25:53,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:53,023 - INFO - Going to convert document batch...
2025-11-14 17:25:53,024 - INFO - Processing document 4_2023-01-04
2025-11-14 17:25:53,050 - INFO - Finished converting document 4_2023-01-04 in 0.08 sec.
2025-11-14 17:25:53,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:53,116 - INFO - Going to convert document batch...
2025-11-14 17:25:53,117 - INFO - Processing document 4_2023-01-10
2025-11-14 17:25:53,136 - INFO - Finished converting document 4_2023-01-10 in 0.06 sec.
2025-11-14 17:25:53,177 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\PEP\10-Q_2025-10-09' --> 'data\processed_data\PEP\10-Q_2025-10-09.md'
Converted 'data\edgar_documents\PEP\4_2023-01-04' --> 'data\processed_data\PEP\4_2023-01-04.md'
Converted 'data\edgar_documents\PEP\4_2023-01-10' --> 'data\processed_data\PEP\4_2023-01-10.md'


2025-11-14 17:25:53,178 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:53,180 - INFO - Going to convert document batch...
2025-11-14 17:25:53,204 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:53,205 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\PEP\4_2023-02-13: File format not allowed: data\edgar_documents\PEP\4_2023-02-13
Error processing data\edgar_documents\PEP\4_2023-02-14: File format not allowed: data\edgar_documents\PEP\4_2023-02-14
Converted 'data\edgar_documents\PEP\4_2023-03-03' --> 'data\processed_data\PEP\4_2023-03-03.md'
Converted 'data\edgar_documents\PEP\4_2023-03-09' --> 'data\processed_data\PEP\4_2023-03-09.md'


2025-11-14 17:25:53,355 - INFO - Processing document 4_2023-03-13
2025-11-14 17:25:53,380 - INFO - Finished converting document 4_2023-03-13 in 0.05 sec.
2025-11-14 17:25:53,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:53,452 - INFO - Going to convert document batch...
2025-11-14 17:25:53,453 - INFO - Processing document 4_2023-05-05
2025-11-14 17:25:53,473 - INFO - Finished converting document 4_2023-05-05 in 0.05 sec.
2025-11-14 17:25:53,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:53,521 - INFO - Going to convert document batch...
2025-11-14 17:25:53,522 - INFO - Processing document 4_2023-06-05
2025-11-14 17:25:53,543 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 17:25:53,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:53,589 - INFO - Going to convert document batch...
2025-11-14 17:25:53,590 - INFO - Processing document 4_2023-10-03
2025-11-14 17:25:53,610 - IN

Converted 'data\edgar_documents\PEP\4_2023-03-13' --> 'data\processed_data\PEP\4_2023-03-13.md'
Converted 'data\edgar_documents\PEP\4_2023-05-05' --> 'data\processed_data\PEP\4_2023-05-05.md'
Converted 'data\edgar_documents\PEP\4_2023-06-05' --> 'data\processed_data\PEP\4_2023-06-05.md'


2025-11-14 17:25:53,673 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:53,674 - ERROR - Input document 4_2023-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:53,675 - INFO - Going to convert document batch...
2025-11-14 17:25:53,697 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:53,698 - ERROR - Input document 4_2023-11-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\PEP\4_2023-10-03' --> 'data\processed_data\PEP\4_2023-10-03.md'
Error processing data\edgar_documents\PEP\4_2023-11-08: File format not allowed: data\edgar_documents\PEP\4_2023-11-08
Error processing data\edgar_documents\PEP\4_2023-11-09: File format not allowed: data\edgar_documents\PEP\4_2023-11-09
Converted 'data\edgar_documents\PEP\4_2023-11-14' --> 'data\processed_data\PEP\4_2023-11-14.md'


2025-11-14 17:25:53,817 - INFO - Going to convert document batch...
2025-11-14 17:25:53,818 - INFO - Processing document 4_2023-12-05
2025-11-14 17:25:53,839 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 17:25:53,885 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:53,886 - ERROR - Input document 4_2024-02-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:53,887 - INFO - Going to convert document batch...
2025-11-14 17:25:53,913 - IN

Converted 'data\edgar_documents\PEP\4_2023-12-05' --> 'data\processed_data\PEP\4_2023-12-05.md'
Error processing data\edgar_documents\PEP\4_2024-02-12: File format not allowed: data\edgar_documents\PEP\4_2024-02-12
Error processing data\edgar_documents\PEP\4_2024-02-13: File format not allowed: data\edgar_documents\PEP\4_2024-02-13
Converted 'data\edgar_documents\PEP\4_2024-02-27' --> 'data\processed_data\PEP\4_2024-02-27.md'
Converted 'data\edgar_documents\PEP\4_2024-03-05' --> 'data\processed_data\PEP\4_2024-03-05.md'


2025-11-14 17:25:54,081 - INFO - Going to convert document batch...
2025-11-14 17:25:54,083 - INFO - Processing document 4_2024-03-08
2025-11-14 17:25:54,107 - INFO - Finished converting document 4_2024-03-08 in 0.08 sec.
2025-11-14 17:25:54,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,158 - INFO - Going to convert document batch...
2025-11-14 17:25:54,160 - INFO - Processing document 4_2024-03-13
2025-11-14 17:25:54,183 - INFO - Finished converting document 4_2024-03-13 in 0.06 sec.
2025-11-14 17:25:54,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,225 - INFO - Going to convert document batch...
2025-11-14 17:25:54,226 - INFO - Processing document 4_2024-05-13
2025-11-14 17:25:54,247 - INFO - Finished converting document 4_2024-05-13 in 0.05 sec.
2025-11-14 17:25:54,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,288 - INFO - Going to convert document batch...
2025-11-14 17:25:54,289 - 

Converted 'data\edgar_documents\PEP\4_2024-03-08' --> 'data\processed_data\PEP\4_2024-03-08.md'
Converted 'data\edgar_documents\PEP\4_2024-03-13' --> 'data\processed_data\PEP\4_2024-03-13.md'
Converted 'data\edgar_documents\PEP\4_2024-05-13' --> 'data\processed_data\PEP\4_2024-05-13.md'


2025-11-14 17:25:54,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,347 - INFO - Going to convert document batch...
2025-11-14 17:25:54,348 - INFO - Processing document 4_2024-06-04
2025-11-14 17:25:54,367 - INFO - Finished converting document 4_2024-06-04 in 0.03 sec.
2025-11-14 17:25:54,438 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:54,438 - ERROR - Input document 4_2024-07-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25

Converted 'data\edgar_documents\PEP\4_2024-05-14' --> 'data\processed_data\PEP\4_2024-05-14.md'
Converted 'data\edgar_documents\PEP\4_2024-06-04' --> 'data\processed_data\PEP\4_2024-06-04.md'
Error processing data\edgar_documents\PEP\4_2024-07-15: File format not allowed: data\edgar_documents\PEP\4_2024-07-15
Error processing data\edgar_documents\PEP\4_2024-07-16: File format not allowed: data\edgar_documents\PEP\4_2024-07-16


2025-11-14 17:25:54,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,549 - INFO - Going to convert document batch...
2025-11-14 17:25:54,550 - INFO - Processing document 4_2024-12-03
2025-11-14 17:25:54,572 - INFO - Finished converting document 4_2024-12-03 in 0.03 sec.
2025-11-14 17:25:54,615 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:54,616 - ERROR - Input document 4_2025-02-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25

Converted 'data\edgar_documents\PEP\4_2024-10-03' --> 'data\processed_data\PEP\4_2024-10-03.md'
Converted 'data\edgar_documents\PEP\4_2024-12-03' --> 'data\processed_data\PEP\4_2024-12-03.md'
Error processing data\edgar_documents\PEP\4_2025-02-05: File format not allowed: data\edgar_documents\PEP\4_2025-02-05
Error processing data\edgar_documents\PEP\4_2025-02-06: File format not allowed: data\edgar_documents\PEP\4_2025-02-06
Converted 'data\edgar_documents\PEP\4_2025-03-03' --> 'data\processed_data\PEP\4_2025-03-03.md'


2025-11-14 17:25:54,751 - INFO - Going to convert document batch...
2025-11-14 17:25:54,752 - INFO - Processing document 4_2025-03-04
2025-11-14 17:25:54,774 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 17:25:54,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,828 - INFO - Going to convert document batch...
2025-11-14 17:25:54,830 - INFO - Processing document 4_2025-03-06
2025-11-14 17:25:54,848 - INFO - Finished converting document 4_2025-03-06 in 0.03 sec.
2025-11-14 17:25:54,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,907 - INFO - Going to convert document batch...
2025-11-14 17:25:54,908 - INFO - Processing document 4_2025-06-03
2025-11-14 17:25:54,929 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 17:25:54,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:54,988 - INFO - Going to convert document batch...
2025-11-14 17:25:54,989 - 

Converted 'data\edgar_documents\PEP\4_2025-03-04' --> 'data\processed_data\PEP\4_2025-03-04.md'
Converted 'data\edgar_documents\PEP\4_2025-03-06' --> 'data\processed_data\PEP\4_2025-03-06.md'
Converted 'data\edgar_documents\PEP\4_2025-06-03' --> 'data\processed_data\PEP\4_2025-06-03.md'


2025-11-14 17:25:55,053 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:55,054 - ERROR - Input document 4_2025-07-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:25:55,056 - INFO - Going to convert document batch...
2025-11-14 17:25:55,081 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:25:55,082 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\PEP\4_2025-07-03' --> 'data\processed_data\PEP\4_2025-07-03.md'
Error processing data\edgar_documents\PEP\4_2025-07-21: File format not allowed: data\edgar_documents\PEP\4_2025-07-21
Error processing data\edgar_documents\PEP\4_2025-07-22: File format not allowed: data\edgar_documents\PEP\4_2025-07-22
Converted 'data\edgar_documents\PEP\4_2025-10-03' --> 'data\processed_data\PEP\4_2025-10-03.md'


2025-11-14 17:25:55,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,254 - INFO - Going to convert document batch...
2025-11-14 17:25:55,255 - INFO - Processing document 8-K_2023-02-15
2025-11-14 17:25:55,313 - INFO - Finished converting document 8-K_2023-02-15 in 0.09 sec.
2025-11-14 17:25:55,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,377 - INFO - Going to convert document batch...
2025-11-14 17:25:55,378 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:25:55,401 - INFO - Finished converting document 8-K_2023-04-25 in 0.06 sec.


Converted 'data\edgar_documents\PEP\8-K_2023-02-09' --> 'data\processed_data\PEP\8-K_2023-02-09.md'
Converted 'data\edgar_documents\PEP\8-K_2023-02-15' --> 'data\processed_data\PEP\8-K_2023-02-15.md'


2025-11-14 17:25:55,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,474 - INFO - Going to convert document batch...
2025-11-14 17:25:55,475 - INFO - Processing document 8-K_2023-05-05
2025-11-14 17:25:55,528 - INFO - Finished converting document 8-K_2023-05-05 in 0.12 sec.
2025-11-14 17:25:55,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,587 - INFO - Going to convert document batch...
2025-11-14 17:25:55,587 - INFO - Processing document 8-K_2023-05-30


Converted 'data\edgar_documents\PEP\8-K_2023-04-25' --> 'data\processed_data\PEP\8-K_2023-04-25.md'
Converted 'data\edgar_documents\PEP\8-K_2023-05-05' --> 'data\processed_data\PEP\8-K_2023-05-05.md'


2025-11-14 17:25:55,622 - INFO - Finished converting document 8-K_2023-05-30 in 0.08 sec.
2025-11-14 17:25:55,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,688 - INFO - Going to convert document batch...
2025-11-14 17:25:55,689 - INFO - Processing document 8-K_2023-07-13
2025-11-14 17:25:55,729 - INFO - Finished converting document 8-K_2023-07-13 in 0.09 sec.
2025-11-14 17:25:55,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,779 - INFO - Going to convert document batch...
2025-11-14 17:25:55,780 - INFO - Processing document 8-K_2023-10-10
2025-11-14 17:25:55,807 - INFO - Finished converting document 8-K_2023-10-10 in 0.06 sec.
2025-11-14 17:25:55,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\8-K_2023-05-30' --> 'data\processed_data\PEP\8-K_2023-05-30.md'
Converted 'data\edgar_documents\PEP\8-K_2023-07-13' --> 'data\processed_data\PEP\8-K_2023-07-13.md'
Converted 'data\edgar_documents\PEP\8-K_2023-10-10' --> 'data\processed_data\PEP\8-K_2023-10-10.md'


2025-11-14 17:25:55,847 - INFO - Going to convert document batch...
2025-11-14 17:25:55,848 - INFO - Processing document 8-K_2023-11-06
2025-11-14 17:25:55,871 - INFO - Finished converting document 8-K_2023-11-06 in 0.06 sec.
2025-11-14 17:25:55,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:55,922 - INFO - Going to convert document batch...
2025-11-14 17:25:55,923 - INFO - Processing document 8-K_2023-11-13
2025-11-14 17:25:55,975 - INFO - Finished converting document 8-K_2023-11-13 in 0.09 sec.
2025-11-14 17:25:56,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,040 - INFO - Going to convert document batch...
2025-11-14 17:25:56,041 - INFO - Processing document 8-K_2023-11-17


Converted 'data\edgar_documents\PEP\8-K_2023-11-06' --> 'data\processed_data\PEP\8-K_2023-11-06.md'
Converted 'data\edgar_documents\PEP\8-K_2023-11-13' --> 'data\processed_data\PEP\8-K_2023-11-13.md'


2025-11-14 17:25:56,064 - INFO - Finished converting document 8-K_2023-11-17 in 0.06 sec.
2025-11-14 17:25:56,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,120 - INFO - Going to convert document batch...
2025-11-14 17:25:56,122 - INFO - Processing document 8-K_2024-01-18
2025-11-14 17:25:56,167 - INFO - Finished converting document 8-K_2024-01-18 in 0.09 sec.
2025-11-14 17:25:56,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,217 - INFO - Going to convert document batch...
2025-11-14 17:25:56,218 - INFO - Processing document 8-K_2024-02-09
2025-11-14 17:25:56,243 - INFO - Finished converting document 8-K_2024-02-09 in 0.05 sec.
2025-11-14 17:25:56,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\8-K_2023-11-17' --> 'data\processed_data\PEP\8-K_2023-11-17.md'
Converted 'data\edgar_documents\PEP\8-K_2024-01-18' --> 'data\processed_data\PEP\8-K_2024-01-18.md'
Converted 'data\edgar_documents\PEP\8-K_2024-02-09' --> 'data\processed_data\PEP\8-K_2024-02-09.md'


2025-11-14 17:25:56,291 - INFO - Going to convert document batch...
2025-11-14 17:25:56,292 - INFO - Processing document 8-K_2024-02-16
2025-11-14 17:25:56,350 - INFO - Finished converting document 8-K_2024-02-16 in 0.09 sec.
2025-11-14 17:25:56,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,413 - INFO - Going to convert document batch...
2025-11-14 17:25:56,413 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:25:56,438 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 17:25:56,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,489 - INFO - Going to convert document batch...
2025-11-14 17:25:56,490 - INFO - Processing document 8-K_2024-05-03
2025-11-14 17:25:56,542 - INFO - Finished converting document 8-K_2024-05-03 in 0.09 sec.


Converted 'data\edgar_documents\PEP\8-K_2024-02-16' --> 'data\processed_data\PEP\8-K_2024-02-16.md'
Converted 'data\edgar_documents\PEP\8-K_2024-04-23' --> 'data\processed_data\PEP\8-K_2024-04-23.md'
Converted 'data\edgar_documents\PEP\8-K_2024-05-03' --> 'data\processed_data\PEP\8-K_2024-05-03.md'


2025-11-14 17:25:56,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,599 - INFO - Going to convert document batch...
2025-11-14 17:25:56,600 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:25:56,648 - INFO - Finished converting document 8-K_2024-05-24 in 0.08 sec.
2025-11-14 17:25:56,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,734 - INFO - Going to convert document batch...
2025-11-14 17:25:56,736 - INFO - Processing document 8-K_2024-07-11
2025-11-14 17:25:56,759 - INFO - Finished converting document 8-K_2024-07-11 in 0.06 sec.
2025-11-14 17:25:56,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,804 - INFO - Going to convert document batch...
2025-11-14 17:25:56,806 - INFO - Processing document 8-K_2024-07-17
2025-11-14 17:25:56,850 - INFO - Finished converting document 8-K_2024-07-17 in 0.08 sec.


Converted 'data\edgar_documents\PEP\8-K_2024-05-24' --> 'data\processed_data\PEP\8-K_2024-05-24.md'
Converted 'data\edgar_documents\PEP\8-K_2024-07-11' --> 'data\processed_data\PEP\8-K_2024-07-11.md'
Converted 'data\edgar_documents\PEP\8-K_2024-07-17' --> 'data\processed_data\PEP\8-K_2024-07-17.md'


2025-11-14 17:25:56,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:56,930 - INFO - Going to convert document batch...
2025-11-14 17:25:56,931 - INFO - Processing document 8-K_2024-09-20
2025-11-14 17:25:56,958 - INFO - Finished converting document 8-K_2024-09-20 in 0.08 sec.
2025-11-14 17:25:56,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,000 - INFO - Going to convert document batch...
2025-11-14 17:25:57,001 - INFO - Processing document 8-K_2024-10-08
2025-11-14 17:25:57,025 - INFO - Finished converting document 8-K_2024-10-08 in 0.05 sec.
2025-11-14 17:25:57,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,081 - INFO - Going to convert document batch...
2025-11-14 17:25:57,082 - INFO - Processing document 8-K_2024-12-11
2025-11-14 17:25:57,106 - INFO - Finished converting document 8-K_2024-12-11 in 0.08 sec.
2025-11-14 17:25:57,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\PEP\8-K_2024-09-20' --> 'data\processed_data\PEP\8-K_2024-09-20.md'
Converted 'data\edgar_documents\PEP\8-K_2024-10-08' --> 'data\processed_data\PEP\8-K_2024-10-08.md'
Converted 'data\edgar_documents\PEP\8-K_2024-12-11' --> 'data\processed_data\PEP\8-K_2024-12-11.md'


2025-11-14 17:25:57,173 - INFO - Finished converting document 8-K_2025-02-04 in 0.06 sec.
2025-11-14 17:25:57,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,212 - INFO - Going to convert document batch...
2025-11-14 17:25:57,213 - INFO - Processing document 8-K_2025-02-07
2025-11-14 17:25:57,235 - INFO - Finished converting document 8-K_2025-02-07 in 0.05 sec.
2025-11-14 17:25:57,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,275 - INFO - Going to convert document batch...
2025-11-14 17:25:57,276 - INFO - Processing document 8-K_2025-04-24
2025-11-14 17:25:57,298 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 17:25:57,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,347 - INFO - Going to convert document batch...
2025-11-14 17:25:57,348 - INFO - Processing document 8-K_2025-05-09
2025-11-14 17:25:57,387 - INFO - Finished converting document 8-K_2025-05-09 in 0.

Converted 'data\edgar_documents\PEP\8-K_2025-02-04' --> 'data\processed_data\PEP\8-K_2025-02-04.md'
Converted 'data\edgar_documents\PEP\8-K_2025-02-07' --> 'data\processed_data\PEP\8-K_2025-02-07.md'
Converted 'data\edgar_documents\PEP\8-K_2025-04-24' --> 'data\processed_data\PEP\8-K_2025-04-24.md'


2025-11-14 17:25:57,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,472 - INFO - Going to convert document batch...
2025-11-14 17:25:57,473 - INFO - Processing document 8-K_2025-05-23
2025-11-14 17:25:57,514 - INFO - Finished converting document 8-K_2025-05-23 in 0.11 sec.
2025-11-14 17:25:57,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,582 - INFO - Going to convert document batch...
2025-11-14 17:25:57,583 - INFO - Processing document 8-K_2025-07-17
2025-11-14 17:25:57,607 - INFO - Finished converting document 8-K_2025-07-17 in 0.08 sec.


Converted 'data\edgar_documents\PEP\8-K_2025-05-09' --> 'data\processed_data\PEP\8-K_2025-05-09.md'
Converted 'data\edgar_documents\PEP\8-K_2025-05-23' --> 'data\processed_data\PEP\8-K_2025-05-23.md'


2025-11-14 17:25:57,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:57,652 - INFO - Going to convert document batch...
2025-11-14 17:25:57,653 - INFO - Processing document 8-K_2025-07-23


Converted 'data\edgar_documents\PEP\8-K_2025-07-17' --> 'data\processed_data\PEP\8-K_2025-07-17.md'


2025-11-14 17:25:58,139 - INFO - Finished converting document 8-K_2025-07-23 in 0.52 sec.
2025-11-14 17:25:58,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:58,206 - INFO - Going to convert document batch...
2025-11-14 17:25:58,206 - INFO - Processing document 8-K_2025-07-28
2025-11-14 17:25:58,249 - INFO - Finished converting document 8-K_2025-07-28 in 0.09 sec.
2025-11-14 17:25:58,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:25:58,326 - INFO - Going to convert document batch...
2025-11-14 17:25:58,327 - INFO - Processing document 8-K_2025-10-09
2025-11-14 17:25:58,352 - INFO - Finished converting document 8-K_2025-10-09 in 0.08 sec.


Converted 'data\edgar_documents\PEP\8-K_2025-07-23' --> 'data\processed_data\PEP\8-K_2025-07-23.md'
Converted 'data\edgar_documents\PEP\8-K_2025-07-28' --> 'data\processed_data\PEP\8-K_2025-07-28.md'


2025-11-14 17:25:58,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\8-K_2025-10-09' --> 'data\processed_data\PEP\8-K_2025-10-09.md'


2025-11-14 17:25:59,081 - INFO - Going to convert document batch...
2025-11-14 17:25:59,082 - INFO - Processing document DEF-14A_2023-03-21
2025-11-14 17:26:16,926 - INFO - Finished converting document DEF-14A_2023-03-21 in 18.56 sec.
2025-11-14 17:26:18,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\DEF-14A_2023-03-21' --> 'data\processed_data\PEP\DEF-14A_2023-03-21.md'


2025-11-14 17:26:19,027 - INFO - Going to convert document batch...
2025-11-14 17:26:19,028 - INFO - Processing document DEF-14A_2024-03-22
2025-11-14 17:26:28,730 - INFO - Finished converting document DEF-14A_2024-03-22 in 10.62 sec.
2025-11-14 17:26:30,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\DEF-14A_2024-03-22' --> 'data\processed_data\PEP\DEF-14A_2024-03-22.md'


2025-11-14 17:26:30,913 - INFO - Going to convert document batch...
2025-11-14 17:26:30,914 - INFO - Processing document DEF-14A_2025-03-28
2025-11-14 17:26:32,351 - INFO - Finished converting document DEF-14A_2025-03-28 in 2.33 sec.
2025-11-14 17:26:34,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PEP\DEF-14A_2025-03-28' --> 'data\processed_data\PEP\DEF-14A_2025-03-28.md'
Processed 70 new files. Errors: 12
Found 149 files to process in data\edgar_documents\PFE


2025-11-14 17:26:35,672 - INFO - Going to convert document batch...
2025-11-14 17:26:35,673 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:26:35,674 - INFO - Processing document 10-K_2023-02-23
2025-11-14 17:26:38,992 - INFO - Finished converting document 10-K_2023-02-23 in 5.03 sec.
2025-11-14 17:26:40,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-K_2023-02-23' --> 'data\processed_data\PFE\10-K_2023-02-23.md'


2025-11-14 17:26:42,204 - INFO - Going to convert document batch...
2025-11-14 17:26:42,205 - INFO - Processing document 10-K_2024-02-22
2025-11-14 17:26:46,115 - INFO - Finished converting document 10-K_2024-02-22 in 5.51 sec.
2025-11-14 17:26:47,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-K_2024-02-22' --> 'data\processed_data\PFE\10-K_2024-02-22.md'


2025-11-14 17:26:49,660 - INFO - Going to convert document batch...
2025-11-14 17:26:49,661 - INFO - Processing document 10-K_2025-02-27
2025-11-14 17:26:53,043 - INFO - Finished converting document 10-K_2025-02-27 in 5.27 sec.
2025-11-14 17:26:54,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-K_2025-02-27' --> 'data\processed_data\PFE\10-K_2025-02-27.md'


2025-11-14 17:26:55,925 - INFO - Going to convert document batch...
2025-11-14 17:26:55,926 - INFO - Processing document 10-Q_2023-05-10
2025-11-14 17:26:57,275 - INFO - Finished converting document 10-Q_2023-05-10 in 2.61 sec.
2025-11-14 17:26:58,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2023-05-10' --> 'data\processed_data\PFE\10-Q_2023-05-10.md'


2025-11-14 17:26:58,903 - INFO - Going to convert document batch...
2025-11-14 17:26:58,904 - INFO - Processing document 10-Q_2023-08-09
2025-11-14 17:27:01,129 - INFO - Finished converting document 10-Q_2023-08-09 in 2.97 sec.
2025-11-14 17:27:02,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2023-08-09' --> 'data\processed_data\PFE\10-Q_2023-08-09.md'


2025-11-14 17:27:02,980 - INFO - Going to convert document batch...
2025-11-14 17:27:02,981 - INFO - Processing document 10-Q_2023-11-08
2025-11-14 17:27:05,007 - INFO - Finished converting document 10-Q_2023-11-08 in 2.84 sec.
2025-11-14 17:27:06,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2023-11-08' --> 'data\processed_data\PFE\10-Q_2023-11-08.md'


2025-11-14 17:27:06,654 - INFO - Going to convert document batch...
2025-11-14 17:27:06,655 - INFO - Processing document 10-Q_2024-05-08
2025-11-14 17:27:08,041 - INFO - Finished converting document 10-Q_2024-05-08 in 2.03 sec.
2025-11-14 17:27:08,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2024-05-08' --> 'data\processed_data\PFE\10-Q_2024-05-08.md'


2025-11-14 17:27:10,192 - INFO - Going to convert document batch...
2025-11-14 17:27:10,193 - INFO - Processing document 10-Q_2024-08-05
2025-11-14 17:27:11,912 - INFO - Finished converting document 10-Q_2024-08-05 in 2.98 sec.
2025-11-14 17:27:13,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2024-08-05' --> 'data\processed_data\PFE\10-Q_2024-08-05.md'


2025-11-14 17:27:14,058 - INFO - Going to convert document batch...
2025-11-14 17:27:14,059 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 17:27:16,042 - INFO - Finished converting document 10-Q_2024-11-04 in 2.73 sec.
2025-11-14 17:27:17,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2024-11-04' --> 'data\processed_data\PFE\10-Q_2024-11-04.md'


2025-11-14 17:27:17,675 - INFO - Going to convert document batch...
2025-11-14 17:27:17,676 - INFO - Processing document 10-Q_2025-05-05
2025-11-14 17:27:18,891 - INFO - Finished converting document 10-Q_2025-05-05 in 1.88 sec.
2025-11-14 17:27:19,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2025-05-05' --> 'data\processed_data\PFE\10-Q_2025-05-05.md'


2025-11-14 17:27:20,923 - INFO - Going to convert document batch...
2025-11-14 17:27:20,924 - INFO - Processing document 10-Q_2025-08-05
2025-11-14 17:27:22,493 - INFO - Finished converting document 10-Q_2025-08-05 in 2.75 sec.
2025-11-14 17:27:23,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\10-Q_2025-08-05' --> 'data\processed_data\PFE\10-Q_2025-08-05.md'


2025-11-14 17:27:24,470 - INFO - Going to convert document batch...
2025-11-14 17:27:24,472 - INFO - Processing document 10-Q_2025-11-04
2025-11-14 17:27:25,966 - INFO - Finished converting document 10-Q_2025-11-04 in 2.55 sec.
2025-11-14 17:27:26,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:26,903 - INFO - Going to convert document batch...
2025-11-14 17:27:26,904 - INFO - Processing document 4_2023-01-03
2025-11-14 17:27:26,922 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 17:27:26,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:26,966 - INFO - Going to convert document batch...
2025-11-14 17:27:26,967 - INFO - Processing document 4_2023-01-13
2025-11-14 17:27:26,985 - INFO - Finished converting document 4_2023-01-13 in 0.05 sec.
2025-11-14 17:27:27,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,040 - INFO - Going to convert document batch...
2025-11-14 17:27:27,

Converted 'data\edgar_documents\PFE\10-Q_2025-11-04' --> 'data\processed_data\PFE\10-Q_2025-11-04.md'
Converted 'data\edgar_documents\PFE\4_2023-01-03' --> 'data\processed_data\PFE\4_2023-01-03.md'
Converted 'data\edgar_documents\PFE\4_2023-01-13' --> 'data\processed_data\PFE\4_2023-01-13.md'


2025-11-14 17:27:27,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,102 - INFO - Going to convert document batch...
2025-11-14 17:27:27,103 - INFO - Processing document 4_2023-02-24
2025-11-14 17:27:27,133 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 17:27:27,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,228 - INFO - Going to convert document batch...
2025-11-14 17:27:27,229 - INFO - Processing document 4_2023-02-28
2025-11-14 17:27:27,260 - INFO - Finished converting document 4_2023-02-28 in 0.08 sec.


Converted 'data\edgar_documents\PFE\4_2023-02-21' --> 'data\processed_data\PFE\4_2023-02-21.md'
Converted 'data\edgar_documents\PFE\4_2023-02-24' --> 'data\processed_data\PFE\4_2023-02-24.md'


2025-11-14 17:27:27,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,308 - INFO - Going to convert document batch...
2025-11-14 17:27:27,309 - INFO - Processing document 4_2023-03-17
2025-11-14 17:27:27,330 - INFO - Finished converting document 4_2023-03-17 in 0.05 sec.
2025-11-14 17:27:27,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,377 - INFO - Going to convert document batch...
2025-11-14 17:27:27,377 - INFO - Processing document 4_2023-03-21
2025-11-14 17:27:27,408 - INFO - Finished converting document 4_2023-03-21 in 0.06 sec.
2025-11-14 17:27:27,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2023-02-28' --> 'data\processed_data\PFE\4_2023-02-28.md'
Converted 'data\edgar_documents\PFE\4_2023-03-17' --> 'data\processed_data\PFE\4_2023-03-17.md'
Converted 'data\edgar_documents\PFE\4_2023-03-21' --> 'data\processed_data\PFE\4_2023-03-21.md'


2025-11-14 17:27:27,485 - INFO - Going to convert document batch...
2025-11-14 17:27:27,487 - INFO - Processing document 4_2023-03-23
2025-11-14 17:27:27,524 - INFO - Finished converting document 4_2023-03-23 in 0.08 sec.
2025-11-14 17:27:27,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,580 - INFO - Going to convert document batch...
2025-11-14 17:27:27,581 - INFO - Processing document 4_2023-04-03
2025-11-14 17:27:27,602 - INFO - Finished converting document 4_2023-04-03 in 0.03 sec.
2025-11-14 17:27:27,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,652 - INFO - Going to convert document batch...
2025-11-14 17:27:27,654 - INFO - Processing document 4_2023-04-04
2025-11-14 17:27:27,677 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 17:27:27,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,738 - INFO - Going to convert document batch...
2025-11-14 17:27:27,739 - 

Converted 'data\edgar_documents\PFE\4_2023-03-23' --> 'data\processed_data\PFE\4_2023-03-23.md'
Converted 'data\edgar_documents\PFE\4_2023-04-03' --> 'data\processed_data\PFE\4_2023-04-03.md'
Converted 'data\edgar_documents\PFE\4_2023-04-04' --> 'data\processed_data\PFE\4_2023-04-04.md'


2025-11-14 17:27:27,759 - INFO - Finished converting document 4_2023-04-14 in 0.05 sec.
2025-11-14 17:27:27,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,807 - INFO - Going to convert document batch...
2025-11-14 17:27:27,808 - INFO - Processing document 4_2023-04-17
2025-11-14 17:27:27,830 - INFO - Finished converting document 4_2023-04-17 in 0.05 sec.
2025-11-14 17:27:27,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:27,914 - INFO - Going to convert document batch...
2025-11-14 17:27:27,915 - INFO - Processing document 4_2023-04-28
2025-11-14 17:27:27,943 - INFO - Finished converting document 4_2023-04-28 in 0.08 sec.
2025-11-14 17:27:27,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2023-04-14' --> 'data\processed_data\PFE\4_2023-04-14.md'
Converted 'data\edgar_documents\PFE\4_2023-04-17' --> 'data\processed_data\PFE\4_2023-04-17.md'
Converted 'data\edgar_documents\PFE\4_2023-04-28' --> 'data\processed_data\PFE\4_2023-04-28.md'


2025-11-14 17:27:27,990 - INFO - Going to convert document batch...
2025-11-14 17:27:27,991 - INFO - Processing document 4_2023-05-01
2025-11-14 17:27:28,008 - INFO - Finished converting document 4_2023-05-01 in 0.03 sec.
2025-11-14 17:27:28,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:28,054 - INFO - Going to convert document batch...
2025-11-14 17:27:28,055 - INFO - Processing document 4_2023-05-09


Converted 'data\edgar_documents\PFE\4_2023-05-01' --> 'data\processed_data\PFE\4_2023-05-01.md'


2025-11-14 17:27:28,542 - INFO - Finished converting document 4_2023-05-09 in 0.52 sec.
2025-11-14 17:27:28,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:28,587 - INFO - Going to convert document batch...
2025-11-14 17:27:28,588 - INFO - Processing document 4_2023-05-11
2025-11-14 17:27:28,608 - INFO - Finished converting document 4_2023-05-11 in 0.05 sec.
2025-11-14 17:27:28,655 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:27:28,655 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\PFE\4_2023-05-09' --> 'data\processed_data\PFE\4_2023-05-09.md'
Converted 'data\edgar_documents\PFE\4_2023-05-11' --> 'data\processed_data\PFE\4_2023-05-11.md'
Error processing data\edgar_documents\PFE\4_2023-05-15: File format not allowed: data\edgar_documents\PFE\4_2023-05-15
Converted 'data\edgar_documents\PFE\4_2023-05-16' --> 'data\processed_data\PFE\4_2023-05-16.md'
Error processing data\edgar_documents\PFE\4_2023-05-18: File format not allowed: data\edgar_documents\PFE\4_2023-05-18


2025-11-14 17:27:28,760 - INFO - Going to convert document batch...
2025-11-14 17:27:28,761 - INFO - Processing document 4_2023-06-01
2025-11-14 17:27:28,780 - INFO - Finished converting document 4_2023-06-01 in 0.05 sec.
2025-11-14 17:27:28,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:28,829 - INFO - Going to convert document batch...
2025-11-14 17:27:28,830 - INFO - Processing document 4_2023-06-16
2025-11-14 17:27:28,851 - INFO - Finished converting document 4_2023-06-16 in 0.03 sec.
2025-11-14 17:27:28,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:28,900 - INFO - Going to convert document batch...
2025-11-14 17:27:28,900 - INFO - Processing document 4_2023-07-03
2025-11-14 17:27:28,918 - INFO - Finished converting document 4_2023-07-03 in 0.05 sec.
2025-11-14 17:27:28,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:28,963 - INFO - Going to convert document batch...
2025-11-14 17:27:28,963 - 

Converted 'data\edgar_documents\PFE\4_2023-06-01' --> 'data\processed_data\PFE\4_2023-06-01.md'
Converted 'data\edgar_documents\PFE\4_2023-06-16' --> 'data\processed_data\PFE\4_2023-06-16.md'
Converted 'data\edgar_documents\PFE\4_2023-07-03' --> 'data\processed_data\PFE\4_2023-07-03.md'


2025-11-14 17:27:29,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,028 - INFO - Going to convert document batch...
2025-11-14 17:27:29,029 - INFO - Processing document 4_2023-07-17
2025-11-14 17:27:29,061 - INFO - Finished converting document 4_2023-07-17 in 0.06 sec.
2025-11-14 17:27:29,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,122 - INFO - Going to convert document batch...
2025-11-14 17:27:29,123 - INFO - Processing document 4_2023-08-01
2025-11-14 17:27:29,146 - INFO - Finished converting document 4_2023-08-01 in 0.05 sec.
2025-11-14 17:27:29,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,189 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PFE\4_2023-07-05' --> 'data\processed_data\PFE\4_2023-07-05.md'
Converted 'data\edgar_documents\PFE\4_2023-07-17' --> 'data\processed_data\PFE\4_2023-07-17.md'
Converted 'data\edgar_documents\PFE\4_2023-08-01' --> 'data\processed_data\PFE\4_2023-08-01.md'


2025-11-14 17:27:29,190 - INFO - Processing document 4_2023-08-16
2025-11-14 17:27:29,208 - INFO - Finished converting document 4_2023-08-16 in 0.03 sec.
2025-11-14 17:27:29,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,273 - INFO - Going to convert document batch...
2025-11-14 17:27:29,275 - INFO - Processing document 4_2023-09-01
2025-11-14 17:27:29,307 - INFO - Finished converting document 4_2023-09-01 in 0.08 sec.
2025-11-14 17:27:29,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,351 - INFO - Going to convert document batch...
2025-11-14 17:27:29,352 - INFO - Processing document 4_2023-09-18
2025-11-14 17:27:29,373 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 17:27:29,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2023-08-16' --> 'data\processed_data\PFE\4_2023-08-16.md'
Converted 'data\edgar_documents\PFE\4_2023-09-01' --> 'data\processed_data\PFE\4_2023-09-01.md'
Converted 'data\edgar_documents\PFE\4_2023-09-18' --> 'data\processed_data\PFE\4_2023-09-18.md'


2025-11-14 17:27:29,427 - INFO - Going to convert document batch...
2025-11-14 17:27:29,429 - INFO - Processing document 4_2023-10-02
2025-11-14 17:27:29,446 - INFO - Finished converting document 4_2023-10-02 in 0.05 sec.
2025-11-14 17:27:29,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,490 - INFO - Going to convert document batch...
2025-11-14 17:27:29,491 - INFO - Processing document 4_2023-10-12
2025-11-14 17:27:29,509 - INFO - Finished converting document 4_2023-10-12 in 0.03 sec.
2025-11-14 17:27:29,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,548 - INFO - Going to convert document batch...
2025-11-14 17:27:29,549 - INFO - Processing document 4_2023-10-16
2025-11-14 17:27:29,568 - INFO - Finished converting document 4_2023-10-16 in 0.03 sec.
2025-11-14 17:27:29,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,631 - INFO - Going to convert document batch...
2025-11-14 17:27:29,632 - 

Converted 'data\edgar_documents\PFE\4_2023-10-02' --> 'data\processed_data\PFE\4_2023-10-02.md'
Converted 'data\edgar_documents\PFE\4_2023-10-12' --> 'data\processed_data\PFE\4_2023-10-12.md'
Converted 'data\edgar_documents\PFE\4_2023-10-16' --> 'data\processed_data\PFE\4_2023-10-16.md'


2025-11-14 17:27:29,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,690 - INFO - Going to convert document batch...
2025-11-14 17:27:29,690 - INFO - Processing document 4_2023-11-16
2025-11-14 17:27:29,710 - INFO - Finished converting document 4_2023-11-16 in 0.03 sec.
2025-11-14 17:27:29,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,752 - INFO - Going to convert document batch...
2025-11-14 17:27:29,754 - INFO - Processing document 4_2023-12-04
2025-11-14 17:27:29,774 - INFO - Finished converting document 4_2023-12-04 in 0.03 sec.
2025-11-14 17:27:29,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,812 - INFO - Going to convert document batch...
2025-11-14 17:27:29,813 - INFO - Processing document 4_2023-12-19
2025-11-14 17:27:29,833 - INFO - Finished converting document 4_2023-12-19 in 0.03 sec.
2025-11-14 17:27:29,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2023-11-01' --> 'data\processed_data\PFE\4_2023-11-01.md'
Converted 'data\edgar_documents\PFE\4_2023-11-16' --> 'data\processed_data\PFE\4_2023-11-16.md'
Converted 'data\edgar_documents\PFE\4_2023-12-04' --> 'data\processed_data\PFE\4_2023-12-04.md'
Converted 'data\edgar_documents\PFE\4_2023-12-19' --> 'data\processed_data\PFE\4_2023-12-19.md'


2025-11-14 17:27:29,875 - INFO - Going to convert document batch...
2025-11-14 17:27:29,876 - INFO - Processing document 4_2023-12-29
2025-11-14 17:27:29,894 - INFO - Finished converting document 4_2023-12-29 in 0.05 sec.
2025-11-14 17:27:29,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:29,938 - INFO - Going to convert document batch...
2025-11-14 17:27:29,939 - INFO - Processing document 4_2024-01-02
2025-11-14 17:27:29,958 - INFO - Finished converting document 4_2024-01-02 in 0.03 sec.
2025-11-14 17:27:29,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,001 - INFO - Going to convert document batch...
2025-11-14 17:27:30,002 - INFO - Processing document 4_2024-01-12
2025-11-14 17:27:30,021 - INFO - Finished converting document 4_2024-01-12 in 0.03 sec.
2025-11-14 17:27:30,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,084 - INFO - Going to convert document batch...
2025-11-14 17:27:30,084 - 

Converted 'data\edgar_documents\PFE\4_2023-12-29' --> 'data\processed_data\PFE\4_2023-12-29.md'
Converted 'data\edgar_documents\PFE\4_2024-01-02' --> 'data\processed_data\PFE\4_2024-01-02.md'
Converted 'data\edgar_documents\PFE\4_2024-01-12' --> 'data\processed_data\PFE\4_2024-01-12.md'
Converted 'data\edgar_documents\PFE\4_2024-02-16' --> 'data\processed_data\PFE\4_2024-02-16.md'


2025-11-14 17:27:30,144 - INFO - Going to convert document batch...
2025-11-14 17:27:30,145 - INFO - Processing document 4_2024-02-27
2025-11-14 17:27:30,173 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 17:27:30,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,223 - INFO - Going to convert document batch...
2025-11-14 17:27:30,223 - INFO - Processing document 4_2024-02-28
2025-11-14 17:27:30,244 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 17:27:30,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,313 - INFO - Going to convert document batch...
2025-11-14 17:27:30,314 - INFO - Processing document 4_2024-02-29
2025-11-14 17:27:30,337 - INFO - Finished converting document 4_2024-02-29 in 0.06 sec.
2025-11-14 17:27:30,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,377 - INFO - Going to convert document batch...
2025-11-14 17:27:30,379 - 

Converted 'data\edgar_documents\PFE\4_2024-02-27' --> 'data\processed_data\PFE\4_2024-02-27.md'
Converted 'data\edgar_documents\PFE\4_2024-02-28' --> 'data\processed_data\PFE\4_2024-02-28.md'
Converted 'data\edgar_documents\PFE\4_2024-02-29' --> 'data\processed_data\PFE\4_2024-02-29.md'


2025-11-14 17:27:30,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,442 - INFO - Going to convert document batch...
2025-11-14 17:27:30,443 - INFO - Processing document 4_2024-03-05
2025-11-14 17:27:30,463 - INFO - Finished converting document 4_2024-03-05 in 0.03 sec.
2025-11-14 17:27:30,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,504 - INFO - Going to convert document batch...
2025-11-14 17:27:30,506 - INFO - Processing document 4_2024-03-18
2025-11-14 17:27:30,523 - INFO - Finished converting document 4_2024-03-18 in 0.03 sec.
2025-11-14 17:27:30,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,581 - INFO - Going to convert document batch...
2025-11-14 17:27:30,582 - INFO - Processing document 4_2024-04-01
2025-11-14 17:27:30,599 - INFO - Finished converting document 4_2024-04-01 in 0.05 sec.


Converted 'data\edgar_documents\PFE\4_2024-03-01' --> 'data\processed_data\PFE\4_2024-03-01.md'
Converted 'data\edgar_documents\PFE\4_2024-03-05' --> 'data\processed_data\PFE\4_2024-03-05.md'
Converted 'data\edgar_documents\PFE\4_2024-03-18' --> 'data\processed_data\PFE\4_2024-03-18.md'
Converted 'data\edgar_documents\PFE\4_2024-04-01' --> 'data\processed_data\PFE\4_2024-04-01.md'


2025-11-14 17:27:30,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,662 - INFO - Going to convert document batch...
2025-11-14 17:27:30,664 - INFO - Processing document 4_2024-04-11
2025-11-14 17:27:30,682 - INFO - Finished converting document 4_2024-04-11 in 0.06 sec.
2025-11-14 17:27:30,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,726 - INFO - Going to convert document batch...
2025-11-14 17:27:30,727 - INFO - Processing document 4_2024-04-16
2025-11-14 17:27:30,745 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 17:27:30,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,783 - INFO - Going to convert document batch...
2025-11-14 17:27:30,784 - INFO - Processing document 4_2024-04-26
2025-11-14 17:27:30,804 - INFO - Finished converting document 4_2024-04-26 in 0.03 sec.
2025-11-14 17:27:30,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\PFE\4_2024-04-11' --> 'data\processed_data\PFE\4_2024-04-11.md'
Converted 'data\edgar_documents\PFE\4_2024-04-16' --> 'data\processed_data\PFE\4_2024-04-16.md'
Converted 'data\edgar_documents\PFE\4_2024-04-26' --> 'data\processed_data\PFE\4_2024-04-26.md'
Converted 'data\edgar_documents\PFE\4_2024-05-01' --> 'data\processed_data\PFE\4_2024-05-01.md'


2025-11-14 17:27:30,900 - INFO - Going to convert document batch...
2025-11-14 17:27:30,901 - INFO - Processing document 4_2024-05-16
2025-11-14 17:27:30,920 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 17:27:30,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:30,961 - INFO - Going to convert document batch...
2025-11-14 17:27:30,962 - INFO - Processing document 4_2024-06-03
2025-11-14 17:27:30,981 - INFO - Finished converting document 4_2024-06-03 in 0.05 sec.
2025-11-14 17:27:31,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,036 - INFO - Going to convert document batch...
2025-11-14 17:27:31,037 - INFO - Processing document 4_2024-06-04
2025-11-14 17:27:31,055 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 17:27:31,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,112 - INFO - Going to convert document batch...
2025-11-14 17:27:31,113 - 

Converted 'data\edgar_documents\PFE\4_2024-05-16' --> 'data\processed_data\PFE\4_2024-05-16.md'
Converted 'data\edgar_documents\PFE\4_2024-06-03' --> 'data\processed_data\PFE\4_2024-06-03.md'
Converted 'data\edgar_documents\PFE\4_2024-06-04' --> 'data\processed_data\PFE\4_2024-06-04.md'


2025-11-14 17:27:31,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,167 - INFO - Going to convert document batch...
2025-11-14 17:27:31,168 - INFO - Processing document 4_2024-07-01
2025-11-14 17:27:31,188 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 17:27:31,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,247 - INFO - Going to convert document batch...
2025-11-14 17:27:31,248 - INFO - Processing document 4_2024-07-12
2025-11-14 17:27:31,276 - INFO - Finished converting document 4_2024-07-12 in 0.06 sec.
2025-11-14 17:27:31,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2024-06-17' --> 'data\processed_data\PFE\4_2024-06-17.md'
Converted 'data\edgar_documents\PFE\4_2024-07-01' --> 'data\processed_data\PFE\4_2024-07-01.md'
Converted 'data\edgar_documents\PFE\4_2024-07-12' --> 'data\processed_data\PFE\4_2024-07-12.md'


2025-11-14 17:27:31,333 - INFO - Going to convert document batch...
2025-11-14 17:27:31,334 - INFO - Processing document 4_2024-07-16
2025-11-14 17:27:31,356 - INFO - Finished converting document 4_2024-07-16 in 0.06 sec.
2025-11-14 17:27:31,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,403 - INFO - Going to convert document batch...
2025-11-14 17:27:31,405 - INFO - Processing document 4_2024-08-02
2025-11-14 17:27:31,423 - INFO - Finished converting document 4_2024-08-02 in 0.05 sec.
2025-11-14 17:27:31,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,464 - INFO - Going to convert document batch...
2025-11-14 17:27:31,465 - INFO - Processing document 4_2024-08-05
2025-11-14 17:27:31,482 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 17:27:31,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,520 - INFO - Going to convert document batch...
2025-11-14 17:27:31,521 - 

Converted 'data\edgar_documents\PFE\4_2024-07-16' --> 'data\processed_data\PFE\4_2024-07-16.md'
Converted 'data\edgar_documents\PFE\4_2024-08-02' --> 'data\processed_data\PFE\4_2024-08-02.md'
Converted 'data\edgar_documents\PFE\4_2024-08-05' --> 'data\processed_data\PFE\4_2024-08-05.md'


2025-11-14 17:27:31,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,597 - INFO - Going to convert document batch...
2025-11-14 17:27:31,598 - INFO - Processing document 4_2024-08-16
2025-11-14 17:27:31,634 - INFO - Finished converting document 4_2024-08-16 in 0.06 sec.
2025-11-14 17:27:31,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,697 - INFO - Going to convert document batch...
2025-11-14 17:27:31,698 - INFO - Processing document 4_2024-09-03
2025-11-14 17:27:31,727 - INFO - Finished converting document 4_2024-09-03 in 0.06 sec.


Converted 'data\edgar_documents\PFE\4_2024-08-14' --> 'data\processed_data\PFE\4_2024-08-14.md'
Converted 'data\edgar_documents\PFE\4_2024-08-16' --> 'data\processed_data\PFE\4_2024-08-16.md'


2025-11-14 17:27:31,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,772 - INFO - Going to convert document batch...
2025-11-14 17:27:31,772 - INFO - Processing document 4_2024-09-16
2025-11-14 17:27:31,800 - INFO - Finished converting document 4_2024-09-16 in 0.05 sec.
2025-11-14 17:27:31,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,850 - INFO - Going to convert document batch...
2025-11-14 17:27:31,851 - INFO - Processing document 4_2024-10-02
2025-11-14 17:27:31,870 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:27:31,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,908 - INFO - Going to convert document batch...
2025-11-14 17:27:31,909 - INFO - Processing document 4_2024-10-11
2025-11-14 17:27:31,929 - INFO - Finished converting document 4_2024-10-11 in 0.03 sec.


Converted 'data\edgar_documents\PFE\4_2024-09-03' --> 'data\processed_data\PFE\4_2024-09-03.md'
Converted 'data\edgar_documents\PFE\4_2024-09-16' --> 'data\processed_data\PFE\4_2024-09-16.md'
Converted 'data\edgar_documents\PFE\4_2024-10-02' --> 'data\processed_data\PFE\4_2024-10-02.md'


2025-11-14 17:27:31,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:31,971 - INFO - Going to convert document batch...
2025-11-14 17:27:31,972 - INFO - Processing document 4_2024-10-15
2025-11-14 17:27:31,995 - INFO - Finished converting document 4_2024-10-15 in 0.05 sec.
2025-11-14 17:27:32,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,056 - INFO - Going to convert document batch...
2025-11-14 17:27:32,057 - INFO - Processing document 4_2024-10-16
2025-11-14 17:27:32,075 - INFO - Finished converting document 4_2024-10-16 in 0.06 sec.
2025-11-14 17:27:32,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,136 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PFE\4_2024-10-11' --> 'data\processed_data\PFE\4_2024-10-11.md'
Converted 'data\edgar_documents\PFE\4_2024-10-15' --> 'data\processed_data\PFE\4_2024-10-15.md'
Converted 'data\edgar_documents\PFE\4_2024-10-16' --> 'data\processed_data\PFE\4_2024-10-16.md'


2025-11-14 17:27:32,137 - INFO - Processing document 4_2024-10-31
2025-11-14 17:27:32,155 - INFO - Finished converting document 4_2024-10-31 in 0.06 sec.
2025-11-14 17:27:32,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,208 - INFO - Going to convert document batch...
2025-11-14 17:27:32,209 - INFO - Processing document 4_2024-11-01
2025-11-14 17:27:32,243 - INFO - Finished converting document 4_2024-11-01 in 0.06 sec.
2025-11-14 17:27:32,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,290 - INFO - Going to convert document batch...
2025-11-14 17:27:32,291 - INFO - Processing document 4_2024-11-18
2025-11-14 17:27:32,310 - INFO - Finished converting document 4_2024-11-18 in 0.05 sec.
2025-11-14 17:27:32,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2024-10-31' --> 'data\processed_data\PFE\4_2024-10-31.md'
Converted 'data\edgar_documents\PFE\4_2024-11-01' --> 'data\processed_data\PFE\4_2024-11-01.md'
Converted 'data\edgar_documents\PFE\4_2024-11-18' --> 'data\processed_data\PFE\4_2024-11-18.md'


2025-11-14 17:27:32,363 - INFO - Going to convert document batch...
2025-11-14 17:27:32,364 - INFO - Processing document 4_2024-12-02
2025-11-14 17:27:32,383 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 17:27:32,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,426 - INFO - Going to convert document batch...
2025-11-14 17:27:32,426 - INFO - Processing document 4_2024-12-17
2025-11-14 17:27:32,447 - INFO - Finished converting document 4_2024-12-17 in 0.03 sec.
2025-11-14 17:27:32,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,486 - INFO - Going to convert document batch...
2025-11-14 17:27:32,487 - INFO - Processing document 4_2025-01-03
2025-11-14 17:27:32,503 - INFO - Finished converting document 4_2025-01-03 in 0.03 sec.
2025-11-14 17:27:32,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,566 - INFO - Going to convert document batch...
2025-11-14 17:27:32,567 - 

Converted 'data\edgar_documents\PFE\4_2024-12-02' --> 'data\processed_data\PFE\4_2024-12-02.md'
Converted 'data\edgar_documents\PFE\4_2024-12-17' --> 'data\processed_data\PFE\4_2024-12-17.md'
Converted 'data\edgar_documents\PFE\4_2025-01-03' --> 'data\processed_data\PFE\4_2025-01-03.md'


2025-11-14 17:27:32,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,630 - INFO - Going to convert document batch...
2025-11-14 17:27:32,631 - INFO - Processing document 4_2025-02-04
2025-11-14 17:27:32,651 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 17:27:32,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,705 - INFO - Going to convert document batch...
2025-11-14 17:27:32,707 - INFO - Processing document 4_2025-02-14
2025-11-14 17:27:32,738 - INFO - Finished converting document 4_2025-02-14 in 0.06 sec.
2025-11-14 17:27:32,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,787 - INFO - Going to convert document batch...
2025-11-14 17:27:32,788 - INFO - Processing document 4_2025-02-18
2025-11-14 17:27:32,810 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.


Converted 'data\edgar_documents\PFE\4_2025-01-15' --> 'data\processed_data\PFE\4_2025-01-15.md'
Converted 'data\edgar_documents\PFE\4_2025-02-04' --> 'data\processed_data\PFE\4_2025-02-04.md'
Converted 'data\edgar_documents\PFE\4_2025-02-14' --> 'data\processed_data\PFE\4_2025-02-14.md'


2025-11-14 17:27:32,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,862 - INFO - Going to convert document batch...
2025-11-14 17:27:32,863 - INFO - Processing document 4_2025-02-25
2025-11-14 17:27:32,891 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 17:27:32,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:32,942 - INFO - Going to convert document batch...
2025-11-14 17:27:32,943 - INFO - Processing document 4_2025-02-28
2025-11-14 17:27:32,968 - INFO - Finished converting document 4_2025-02-28 in 0.05 sec.
2025-11-14 17:27:33,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2025-02-18' --> 'data\processed_data\PFE\4_2025-02-18.md'
Converted 'data\edgar_documents\PFE\4_2025-02-25' --> 'data\processed_data\PFE\4_2025-02-25.md'
Converted 'data\edgar_documents\PFE\4_2025-02-28' --> 'data\processed_data\PFE\4_2025-02-28.md'


2025-11-14 17:27:33,025 - INFO - Going to convert document batch...
2025-11-14 17:27:33,026 - INFO - Processing document 4_2025-03-03
2025-11-14 17:27:33,052 - INFO - Finished converting document 4_2025-03-03 in 0.05 sec.
2025-11-14 17:27:33,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,115 - INFO - Going to convert document batch...
2025-11-14 17:27:33,117 - INFO - Processing document 4_2025-03-06
2025-11-14 17:27:33,145 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 17:27:33,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,189 - INFO - Going to convert document batch...
2025-11-14 17:27:33,190 - INFO - Processing document 4_2025-03-18
2025-11-14 17:27:33,210 - INFO - Finished converting document 4_2025-03-18 in 0.03 sec.
2025-11-14 17:27:33,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,252 - INFO - Going to convert document batch...
2025-11-14 17:27:33,253 - 

Converted 'data\edgar_documents\PFE\4_2025-03-03' --> 'data\processed_data\PFE\4_2025-03-03.md'
Converted 'data\edgar_documents\PFE\4_2025-03-06' --> 'data\processed_data\PFE\4_2025-03-06.md'
Converted 'data\edgar_documents\PFE\4_2025-03-18' --> 'data\processed_data\PFE\4_2025-03-18.md'


2025-11-14 17:27:33,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,542 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PFE\4_2025-04-02' --> 'data\processed_data\PFE\4_2025-04-02.md'


2025-11-14 17:27:33,543 - INFO - Processing document 4_2025-04-14
2025-11-14 17:27:33,562 - INFO - Finished converting document 4_2025-04-14 in 0.27 sec.
2025-11-14 17:27:33,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,604 - INFO - Going to convert document batch...
2025-11-14 17:27:33,605 - INFO - Processing document 4_2025-04-17
2025-11-14 17:27:33,626 - INFO - Finished converting document 4_2025-04-17 in 0.05 sec.
2025-11-14 17:27:33,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,669 - INFO - Going to convert document batch...
2025-11-14 17:27:33,670 - INFO - Processing document 4_2025-04-28
2025-11-14 17:27:33,692 - INFO - Finished converting document 4_2025-04-28 in 0.05 sec.
2025-11-14 17:27:33,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,729 - INFO - Going to convert document batch...
2025-11-14 17:27:33,730 - INFO - Processing document 4_2025-05-02
2025-11-14 17:27:33,748 - IN

Converted 'data\edgar_documents\PFE\4_2025-04-14' --> 'data\processed_data\PFE\4_2025-04-14.md'
Converted 'data\edgar_documents\PFE\4_2025-04-17' --> 'data\processed_data\PFE\4_2025-04-17.md'
Converted 'data\edgar_documents\PFE\4_2025-04-28' --> 'data\processed_data\PFE\4_2025-04-28.md'


2025-11-14 17:27:33,792 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:27:33,793 - ERROR - Input document 4_2025-05-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:27:33,794 - INFO - Going to convert document batch...
2025-11-14 17:27:33,817 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:27:33,819 - ERROR - Input document 4_2025-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\PFE\4_2025-05-02' --> 'data\processed_data\PFE\4_2025-05-02.md'
Error processing data\edgar_documents\PFE\4_2025-05-13: File format not allowed: data\edgar_documents\PFE\4_2025-05-13
Error processing data\edgar_documents\PFE\4_2025-05-15: File format not allowed: data\edgar_documents\PFE\4_2025-05-15
Converted 'data\edgar_documents\PFE\4_2025-05-19' --> 'data\processed_data\PFE\4_2025-05-19.md'


2025-11-14 17:27:33,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:33,980 - INFO - Going to convert document batch...
2025-11-14 17:27:33,981 - INFO - Processing document 4_2025-06-17
2025-11-14 17:27:34,003 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 17:27:34,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,045 - INFO - Going to convert document batch...
2025-11-14 17:27:34,046 - INFO - Processing document 4_2025-07-02
2025-11-14 17:27:34,065 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:27:34,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,105 - INFO - Going to convert document batch...
2025-11-14 17:27:34,106 - INFO - Processing document 4_2025-07-16
2025-11-14 17:27:34,126 - INFO - Finished converting document 4_2025-07-16 in 0.05 sec.
2025-11-14 17:27:34,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2025-06-03' --> 'data\processed_data\PFE\4_2025-06-03.md'
Converted 'data\edgar_documents\PFE\4_2025-06-17' --> 'data\processed_data\PFE\4_2025-06-17.md'
Converted 'data\edgar_documents\PFE\4_2025-07-02' --> 'data\processed_data\PFE\4_2025-07-02.md'
Converted 'data\edgar_documents\PFE\4_2025-07-16' --> 'data\processed_data\PFE\4_2025-07-16.md'


2025-11-14 17:27:34,167 - INFO - Going to convert document batch...
2025-11-14 17:27:34,168 - INFO - Processing document 4_2025-08-04
2025-11-14 17:27:34,187 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.
2025-11-14 17:27:34,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,250 - INFO - Going to convert document batch...
2025-11-14 17:27:34,251 - INFO - Processing document 4_2025-08-19
2025-11-14 17:27:34,275 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 17:27:34,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,315 - INFO - Going to convert document batch...
2025-11-14 17:27:34,316 - INFO - Processing document 4_2025-09-03
2025-11-14 17:27:34,337 - INFO - Finished converting document 4_2025-09-03 in 0.03 sec.
2025-11-14 17:27:34,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,379 - INFO - Going to convert document batch...
2025-11-14 17:27:34,379 - 

Converted 'data\edgar_documents\PFE\4_2025-08-04' --> 'data\processed_data\PFE\4_2025-08-04.md'
Converted 'data\edgar_documents\PFE\4_2025-08-19' --> 'data\processed_data\PFE\4_2025-08-19.md'
Converted 'data\edgar_documents\PFE\4_2025-09-03' --> 'data\processed_data\PFE\4_2025-09-03.md'
Converted 'data\edgar_documents\PFE\4_2025-09-17' --> 'data\processed_data\PFE\4_2025-09-17.md'


2025-11-14 17:27:34,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,454 - INFO - Going to convert document batch...
2025-11-14 17:27:34,455 - INFO - Processing document 4_2025-10-02
2025-11-14 17:27:34,474 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 17:27:34,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,517 - INFO - Going to convert document batch...
2025-11-14 17:27:34,518 - INFO - Processing document 4_2025-10-16
2025-11-14 17:27:34,538 - INFO - Finished converting document 4_2025-10-16 in 0.03 sec.
2025-11-14 17:27:34,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,615 - INFO - Going to convert document batch...
2025-11-14 17:27:34,616 - INFO - Processing document 4_2025-10-17
2025-11-14 17:27:34,636 - INFO - Finished converting document 4_2025-10-17 in 0.06 sec.
2025-11-14 17:27:34,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\4_2025-10-02' --> 'data\processed_data\PFE\4_2025-10-02.md'
Converted 'data\edgar_documents\PFE\4_2025-10-16' --> 'data\processed_data\PFE\4_2025-10-16.md'
Converted 'data\edgar_documents\PFE\4_2025-10-17' --> 'data\processed_data\PFE\4_2025-10-17.md'


2025-11-14 17:27:34,692 - INFO - Going to convert document batch...
2025-11-14 17:27:34,692 - INFO - Processing document 4_2025-11-03
2025-11-14 17:27:34,712 - INFO - Finished converting document 4_2025-11-03 in 0.05 sec.
2025-11-14 17:27:34,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,768 - INFO - Going to convert document batch...
2025-11-14 17:27:34,769 - INFO - Processing document 8-K_2023-01-31
2025-11-14 17:27:34,790 - INFO - Finished converting document 8-K_2023-01-31 in 0.05 sec.
2025-11-14 17:27:34,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,831 - INFO - Going to convert document batch...
2025-11-14 17:27:34,832 - INFO - Processing document 8-K_2023-02-21
2025-11-14 17:27:34,851 - INFO - Finished converting document 8-K_2023-02-21 in 0.05 sec.
2025-11-14 17:27:34,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,893 - INFO - Going to convert document batch...
2025-11-14 17:27:3

Converted 'data\edgar_documents\PFE\4_2025-11-03' --> 'data\processed_data\PFE\4_2025-11-03.md'
Converted 'data\edgar_documents\PFE\8-K_2023-01-31' --> 'data\processed_data\PFE\8-K_2023-01-31.md'
Converted 'data\edgar_documents\PFE\8-K_2023-02-21' --> 'data\processed_data\PFE\8-K_2023-02-21.md'


2025-11-14 17:27:34,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:34,974 - INFO - Going to convert document batch...
2025-11-14 17:27:34,975 - INFO - Processing document 8-K_2023-05-01
2025-11-14 17:27:35,028 - INFO - Finished converting document 8-K_2023-05-01 in 0.11 sec.
2025-11-14 17:27:35,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\8-K_2023-03-13' --> 'data\processed_data\PFE\8-K_2023-03-13.md'
Converted 'data\edgar_documents\PFE\8-K_2023-05-01' --> 'data\processed_data\PFE\8-K_2023-05-01.md'


2025-11-14 17:27:35,122 - INFO - Going to convert document batch...
2025-11-14 17:27:35,123 - INFO - Processing document 8-K_2023-05-02
2025-11-14 17:27:35,145 - INFO - Finished converting document 8-K_2023-05-02 in 0.05 sec.
2025-11-14 17:27:35,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,185 - INFO - Going to convert document batch...
2025-11-14 17:27:35,186 - INFO - Processing document 8-K_2023-05-15
2025-11-14 17:27:35,198 - INFO - Finished converting document 8-K_2023-05-15 in 0.05 sec.
2025-11-14 17:27:35,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,239 - INFO - Going to convert document batch...
2025-11-14 17:27:35,240 - INFO - Processing document 8-K_2023-05-19
2025-11-14 17:27:35,270 - INFO - Finished converting document 8-K_2023-05-19 in 0.06 sec.
2025-11-14 17:27:35,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,312 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PFE\8-K_2023-05-02' --> 'data\processed_data\PFE\8-K_2023-05-02.md'
Converted 'data\edgar_documents\PFE\8-K_2023-05-15' --> 'data\processed_data\PFE\8-K_2023-05-15.md'
Converted 'data\edgar_documents\PFE\8-K_2023-05-19' --> 'data\processed_data\PFE\8-K_2023-05-19.md'


2025-11-14 17:27:35,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,377 - INFO - Going to convert document batch...
2025-11-14 17:27:35,378 - INFO - Processing document 8-K_2023-08-01
2025-11-14 17:27:35,402 - INFO - Finished converting document 8-K_2023-08-01 in 0.06 sec.
2025-11-14 17:27:35,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,448 - INFO - Going to convert document batch...
2025-11-14 17:27:35,448 - INFO - Processing document 8-K_2023-10-13
2025-11-14 17:27:35,477 - INFO - Finished converting document 8-K_2023-10-13 in 0.05 sec.
2025-11-14 17:27:35,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\8-K_2023-07-27' --> 'data\processed_data\PFE\8-K_2023-07-27.md'
Converted 'data\edgar_documents\PFE\8-K_2023-08-01' --> 'data\processed_data\PFE\8-K_2023-08-01.md'
Converted 'data\edgar_documents\PFE\8-K_2023-10-13' --> 'data\processed_data\PFE\8-K_2023-10-13.md'


2025-11-14 17:27:35,552 - INFO - Going to convert document batch...
2025-11-14 17:27:35,553 - INFO - Processing document 8-K_2023-10-31
2025-11-14 17:27:35,575 - INFO - Finished converting document 8-K_2023-10-31 in 0.08 sec.
2025-11-14 17:27:35,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,618 - INFO - Going to convert document batch...
2025-11-14 17:27:35,618 - INFO - Processing document 8-K_2023-12-12
2025-11-14 17:27:35,643 - INFO - Finished converting document 8-K_2023-12-12 in 0.06 sec.
2025-11-14 17:27:35,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,693 - INFO - Going to convert document batch...
2025-11-14 17:27:35,694 - INFO - Processing document 8-K_2023-12-13
2025-11-14 17:27:35,715 - INFO - Finished converting document 8-K_2023-12-13 in 0.05 sec.
2025-11-14 17:27:35,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\8-K_2023-10-31' --> 'data\processed_data\PFE\8-K_2023-10-31.md'
Converted 'data\edgar_documents\PFE\8-K_2023-12-12' --> 'data\processed_data\PFE\8-K_2023-12-12.md'
Converted 'data\edgar_documents\PFE\8-K_2023-12-13' --> 'data\processed_data\PFE\8-K_2023-12-13.md'


2025-11-14 17:27:35,780 - INFO - Going to convert document batch...
2025-11-14 17:27:35,781 - INFO - Processing document 8-K_2023-12-14
2025-11-14 17:27:35,801 - INFO - Finished converting document 8-K_2023-12-14 in 0.06 sec.
2025-11-14 17:27:35,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,845 - INFO - Going to convert document batch...
2025-11-14 17:27:35,847 - INFO - Processing document 8-K_2024-01-10
2025-11-14 17:27:35,875 - INFO - Finished converting document 8-K_2024-01-10 in 0.06 sec.
2025-11-14 17:27:35,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,922 - INFO - Going to convert document batch...
2025-11-14 17:27:35,923 - INFO - Processing document 8-K_2024-01-30
2025-11-14 17:27:35,947 - INFO - Finished converting document 8-K_2024-01-30 in 0.05 sec.
2025-11-14 17:27:35,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:35,990 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PFE\8-K_2023-12-14' --> 'data\processed_data\PFE\8-K_2023-12-14.md'
Converted 'data\edgar_documents\PFE\8-K_2024-01-10' --> 'data\processed_data\PFE\8-K_2024-01-10.md'
Converted 'data\edgar_documents\PFE\8-K_2024-01-30' --> 'data\processed_data\PFE\8-K_2024-01-30.md'


2025-11-14 17:27:36,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,112 - INFO - Going to convert document batch...
2025-11-14 17:27:36,113 - INFO - Processing document 8-K_2024-05-01
2025-11-14 17:27:36,135 - INFO - Finished converting document 8-K_2024-05-01 in 0.05 sec.
2025-11-14 17:27:36,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,171 - INFO - Going to convert document batch...
2025-11-14 17:27:36,171 - INFO - Processing document 8-K_2024-05-22
2025-11-14 17:27:36,189 - INFO - Finished converting document 8-K_2024-05-22 in 0.05 sec.
2025-11-14 17:27:36,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,220 - INFO - Going to convert document batch...
2025-11-14 17:27:36,221 - INFO - Processing document 8-K_2024-07-01
2025-11-14 17:27:36,241 - INFO - Finished converting document 8-K_2024-07-01 in 0.03 sec.
2025-11-14 17:27:36,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\PFE\8-K_2024-04-29' --> 'data\processed_data\PFE\8-K_2024-04-29.md'
Converted 'data\edgar_documents\PFE\8-K_2024-05-01' --> 'data\processed_data\PFE\8-K_2024-05-01.md'
Converted 'data\edgar_documents\PFE\8-K_2024-05-22' --> 'data\processed_data\PFE\8-K_2024-05-22.md'
Converted 'data\edgar_documents\PFE\8-K_2024-07-01' --> 'data\processed_data\PFE\8-K_2024-07-01.md'


2025-11-14 17:27:36,282 - INFO - Processing document 8-K_2024-07-10
2025-11-14 17:27:36,301 - INFO - Finished converting document 8-K_2024-07-10 in 0.05 sec.
2025-11-14 17:27:36,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,344 - INFO - Going to convert document batch...
2025-11-14 17:27:36,345 - INFO - Processing document 8-K_2024-07-26
2025-11-14 17:27:36,369 - INFO - Finished converting document 8-K_2024-07-26 in 0.05 sec.
2025-11-14 17:27:36,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,409 - INFO - Going to convert document batch...
2025-11-14 17:27:36,409 - INFO - Processing document 8-K_2024-07-30
2025-11-14 17:27:36,430 - INFO - Finished converting document 8-K_2024-07-30 in 0.03 sec.
2025-11-14 17:27:36,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,464 - INFO - Going to convert document batch...
2025-11-14 17:27:36,464 - INFO - Processing document 8-K_2024-10-15
2025-11-14 17:

Converted 'data\edgar_documents\PFE\8-K_2024-07-10' --> 'data\processed_data\PFE\8-K_2024-07-10.md'
Converted 'data\edgar_documents\PFE\8-K_2024-07-26' --> 'data\processed_data\PFE\8-K_2024-07-26.md'
Converted 'data\edgar_documents\PFE\8-K_2024-07-30' --> 'data\processed_data\PFE\8-K_2024-07-30.md'
Converted 'data\edgar_documents\PFE\8-K_2024-10-15' --> 'data\processed_data\PFE\8-K_2024-10-15.md'


2025-11-14 17:27:36,523 - INFO - Going to convert document batch...
2025-11-14 17:27:36,524 - INFO - Processing document 8-K_2024-10-29
2025-11-14 17:27:36,546 - INFO - Finished converting document 8-K_2024-10-29 in 0.05 sec.
2025-11-14 17:27:36,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,598 - INFO - Going to convert document batch...
2025-11-14 17:27:36,599 - INFO - Processing document 8-K_2024-12-17
2025-11-14 17:27:36,628 - INFO - Finished converting document 8-K_2024-12-17 in 0.06 sec.
2025-11-14 17:27:36,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,667 - INFO - Going to convert document batch...
2025-11-14 17:27:36,668 - INFO - Processing document 8-K_2025-02-04
2025-11-14 17:27:36,688 - INFO - Finished converting document 8-K_2025-02-04 in 0.05 sec.
2025-11-14 17:27:36,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,731 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PFE\8-K_2024-10-29' --> 'data\processed_data\PFE\8-K_2024-10-29.md'
Converted 'data\edgar_documents\PFE\8-K_2024-12-17' --> 'data\processed_data\PFE\8-K_2024-12-17.md'
Converted 'data\edgar_documents\PFE\8-K_2025-02-04' --> 'data\processed_data\PFE\8-K_2025-02-04.md'


2025-11-14 17:27:36,766 - INFO - Finished converting document 8-K_2025-04-28 in 0.06 sec.
2025-11-14 17:27:36,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,857 - INFO - Going to convert document batch...
2025-11-14 17:27:36,858 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:27:36,890 - INFO - Finished converting document 8-K_2025-04-29 in 0.06 sec.
2025-11-14 17:27:36,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,931 - INFO - Going to convert document batch...
2025-11-14 17:27:36,932 - INFO - Processing document 8-K_2025-05-19
2025-11-14 17:27:36,960 - INFO - Finished converting document 8-K_2025-05-19 in 0.05 sec.
2025-11-14 17:27:36,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:36,998 - INFO - Going to convert document batch...
2025-11-14 17:27:36,999 - INFO - Processing document 8-K_2025-08-05


Converted 'data\edgar_documents\PFE\8-K_2025-04-28' --> 'data\processed_data\PFE\8-K_2025-04-28.md'
Converted 'data\edgar_documents\PFE\8-K_2025-04-29' --> 'data\processed_data\PFE\8-K_2025-04-29.md'
Converted 'data\edgar_documents\PFE\8-K_2025-05-19' --> 'data\processed_data\PFE\8-K_2025-05-19.md'


2025-11-14 17:27:37,022 - INFO - Finished converting document 8-K_2025-08-05 in 0.05 sec.
2025-11-14 17:27:37,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:27:37,062 - INFO - Going to convert document batch...
2025-11-14 17:27:37,063 - INFO - Processing document 8-K_2025-11-04
2025-11-14 17:27:37,092 - INFO - Finished converting document 8-K_2025-11-04 in 0.06 sec.
2025-11-14 17:27:37,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\8-K_2025-08-05' --> 'data\processed_data\PFE\8-K_2025-08-05.md'
Converted 'data\edgar_documents\PFE\8-K_2025-11-04' --> 'data\processed_data\PFE\8-K_2025-11-04.md'


2025-11-14 17:27:37,887 - INFO - Going to convert document batch...
2025-11-14 17:27:37,887 - INFO - Processing document DEF-14A_2023-03-16
2025-11-14 17:27:40,060 - INFO - Finished converting document DEF-14A_2023-03-16 in 2.95 sec.
2025-11-14 17:27:41,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\DEF-14A_2023-03-16' --> 'data\processed_data\PFE\DEF-14A_2023-03-16.md'


2025-11-14 17:27:42,074 - INFO - Going to convert document batch...
2025-11-14 17:27:42,075 - INFO - Processing document DEF-14A_2024-03-14
2025-11-14 17:27:44,329 - INFO - Finished converting document DEF-14A_2024-03-14 in 2.83 sec.
2025-11-14 17:27:45,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\DEF-14A_2024-03-14' --> 'data\processed_data\PFE\DEF-14A_2024-03-14.md'


2025-11-14 17:27:46,404 - INFO - Going to convert document batch...
2025-11-14 17:27:46,405 - INFO - Processing document DEF-14A_2025-03-13
2025-11-14 17:27:48,566 - INFO - Finished converting document DEF-14A_2025-03-13 in 2.78 sec.
2025-11-14 17:27:49,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PFE\DEF-14A_2025-03-13' --> 'data\processed_data\PFE\DEF-14A_2025-03-13.md'
Processed 145 new files. Errors: 4
Found 169 files to process in data\edgar_documents\PG


2025-11-14 17:27:50,492 - INFO - Going to convert document batch...
2025-11-14 17:27:50,493 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:27:50,493 - INFO - Processing document 10-K_2023-08-04
2025-11-14 17:27:51,567 - INFO - Finished converting document 10-K_2023-08-04 in 2.02 sec.
2025-11-14 17:27:52,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-K_2023-08-04' --> 'data\processed_data\PG\10-K_2023-08-04.md'


2025-11-14 17:27:52,879 - INFO - Going to convert document batch...
2025-11-14 17:27:52,880 - INFO - Processing document 10-K_2024-08-05
2025-11-14 17:27:54,030 - INFO - Finished converting document 10-K_2024-08-05 in 1.92 sec.
2025-11-14 17:27:54,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-K_2024-08-05' --> 'data\processed_data\PG\10-K_2024-08-05.md'


2025-11-14 17:27:55,459 - INFO - Going to convert document batch...
2025-11-14 17:27:55,460 - INFO - Processing document 10-K_2025-08-04
2025-11-14 17:27:56,658 - INFO - Finished converting document 10-K_2025-08-04 in 2.06 sec.
2025-11-14 17:27:57,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-K_2025-08-04' --> 'data\processed_data\PG\10-K_2025-08-04.md'


2025-11-14 17:27:57,541 - INFO - Going to convert document batch...
2025-11-14 17:27:57,542 - INFO - Processing document 10-Q_2023-01-19
2025-11-14 17:27:58,054 - INFO - Finished converting document 10-Q_2023-01-19 in 0.78 sec.
2025-11-14 17:27:58,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2023-01-19' --> 'data\processed_data\PG\10-Q_2023-01-19.md'


2025-11-14 17:27:58,619 - INFO - Going to convert document batch...
2025-11-14 17:27:58,620 - INFO - Processing document 10-Q_2023-04-21
2025-11-14 17:27:59,482 - INFO - Finished converting document 10-Q_2023-04-21 in 1.16 sec.
2025-11-14 17:27:59,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2023-04-21' --> 'data\processed_data\PG\10-Q_2023-04-21.md'


2025-11-14 17:27:59,981 - INFO - Going to convert document batch...
2025-11-14 17:27:59,982 - INFO - Processing document 10-Q_2023-10-18
2025-11-14 17:28:00,378 - INFO - Finished converting document 10-Q_2023-10-18 in 0.62 sec.
2025-11-14 17:28:00,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2023-10-18' --> 'data\processed_data\PG\10-Q_2023-10-18.md'


2025-11-14 17:28:00,956 - INFO - Going to convert document batch...
2025-11-14 17:28:00,957 - INFO - Processing document 10-Q_2024-01-23
2025-11-14 17:28:01,494 - INFO - Finished converting document 10-Q_2024-01-23 in 0.89 sec.
2025-11-14 17:28:01,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2024-01-23' --> 'data\processed_data\PG\10-Q_2024-01-23.md'


2025-11-14 17:28:02,471 - INFO - Going to convert document batch...
2025-11-14 17:28:02,472 - INFO - Processing document 10-Q_2024-04-19
2025-11-14 17:28:03,017 - INFO - Finished converting document 10-Q_2024-04-19 in 1.20 sec.
2025-11-14 17:28:03,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2024-04-19' --> 'data\processed_data\PG\10-Q_2024-04-19.md'


2025-11-14 17:28:03,568 - INFO - Going to convert document batch...
2025-11-14 17:28:03,569 - INFO - Processing document 10-Q_2024-10-18
2025-11-14 17:28:04,022 - INFO - Finished converting document 10-Q_2024-10-18 in 0.69 sec.
2025-11-14 17:28:04,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2024-10-18' --> 'data\processed_data\PG\10-Q_2024-10-18.md'


2025-11-14 17:28:04,881 - INFO - Going to convert document batch...
2025-11-14 17:28:04,882 - INFO - Processing document 10-Q_2025-01-22
2025-11-14 17:28:05,464 - INFO - Finished converting document 10-Q_2025-01-22 in 1.19 sec.
2025-11-14 17:28:05,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2025-01-22' --> 'data\processed_data\PG\10-Q_2025-01-22.md'


2025-11-14 17:28:06,100 - INFO - Going to convert document batch...
2025-11-14 17:28:06,101 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:28:06,679 - INFO - Finished converting document 10-Q_2025-04-24 in 0.89 sec.
2025-11-14 17:28:07,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\10-Q_2025-04-24' --> 'data\processed_data\PG\10-Q_2025-04-24.md'


2025-11-14 17:28:07,510 - INFO - Going to convert document batch...
2025-11-14 17:28:07,511 - INFO - Processing document 10-Q_2025-10-24
2025-11-14 17:28:07,997 - INFO - Finished converting document 10-Q_2025-10-24 in 1.00 sec.
2025-11-14 17:28:08,333 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:08,335 - ERROR - Input document 4_2023-01-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:08,337 - INFO - Going to convert document batch...
2025-11-14 17:28:08,35

Converted 'data\edgar_documents\PG\10-Q_2025-10-24' --> 'data\processed_data\PG\10-Q_2025-10-24.md'
Error processing data\edgar_documents\PG\4_2023-01-23: File format not allowed: data\edgar_documents\PG\4_2023-01-23
Error processing data\edgar_documents\PG\4_2023-01-25: File format not allowed: data\edgar_documents\PG\4_2023-01-25
Error processing data\edgar_documents\PG\4_2023-01-27: File format not allowed: data\edgar_documents\PG\4_2023-01-27
Error processing data\edgar_documents\PG\4_2023-01-31: File format not allowed: data\edgar_documents\PG\4_2023-01-31
Converted 'data\edgar_documents\PG\4_2023-02-06' --> 'data\processed_data\PG\4_2023-02-06.md'


2025-11-14 17:28:08,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:08,510 - INFO - Going to convert document batch...
2025-11-14 17:28:08,512 - INFO - Processing document 4_2023-03-02
2025-11-14 17:28:08,531 - INFO - Finished converting document 4_2023-03-02 in 0.06 sec.
2025-11-14 17:28:08,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:08,573 - INFO - Going to convert document batch...
2025-11-14 17:28:08,574 - INFO - Processing document 4_2023-03-15
2025-11-14 17:28:08,592 - INFO - Finished converting document 4_2023-03-15 in 0.05 sec.
2025-11-14 17:28:08,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:08,676 - INFO - Going to convert document batch...
2025-11-14 17:28:08,678 - INFO - Processing document 4_2023-04-24
2025-11-14 17:28:08,708 - INFO - Finished converting document 4_2023-04-24 in 0.09 sec.


Converted 'data\edgar_documents\PG\4_2023-03-02' --> 'data\processed_data\PG\4_2023-03-02.md'
Converted 'data\edgar_documents\PG\4_2023-03-15' --> 'data\processed_data\PG\4_2023-03-15.md'


2025-11-14 17:28:08,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:08,757 - INFO - Going to convert document batch...
2025-11-14 17:28:08,757 - INFO - Processing document 4_2023-04-25
2025-11-14 17:28:08,781 - INFO - Finished converting document 4_2023-04-25 in 0.05 sec.
2025-11-14 17:28:08,829 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:08,830 - ERROR - Input document 4_2023-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28

Converted 'data\edgar_documents\PG\4_2023-04-24' --> 'data\processed_data\PG\4_2023-04-24.md'
Converted 'data\edgar_documents\PG\4_2023-04-25' --> 'data\processed_data\PG\4_2023-04-25.md'
Error processing data\edgar_documents\PG\4_2023-04-26: File format not allowed: data\edgar_documents\PG\4_2023-04-26
Converted 'data\edgar_documents\PG\4_2023-04-27' --> 'data\processed_data\PG\4_2023-04-27.md'


2025-11-14 17:28:08,931 - INFO - Going to convert document batch...
2025-11-14 17:28:08,932 - INFO - Processing document 4_2023-04-28
2025-11-14 17:28:08,956 - INFO - Finished converting document 4_2023-04-28 in 0.05 sec.
2025-11-14 17:28:09,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,034 - INFO - Going to convert document batch...
2025-11-14 17:28:09,035 - INFO - Processing document 4_2023-05-02
2025-11-14 17:28:09,065 - INFO - Finished converting document 4_2023-05-02 in 0.06 sec.
2025-11-14 17:28:09,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,131 - INFO - Going to convert document batch...
2025-11-14 17:28:09,132 - INFO - Processing document 4_2023-06-14
2025-11-14 17:28:09,158 - INFO - Finished converting document 4_2023-06-14 in 0.06 sec.
2025-11-14 17:28:09,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\4_2023-04-28' --> 'data\processed_data\PG\4_2023-04-28.md'
Converted 'data\edgar_documents\PG\4_2023-05-02' --> 'data\processed_data\PG\4_2023-05-02.md'
Converted 'data\edgar_documents\PG\4_2023-06-14' --> 'data\processed_data\PG\4_2023-06-14.md'


2025-11-14 17:28:09,205 - INFO - Going to convert document batch...
2025-11-14 17:28:09,205 - INFO - Processing document 4_2023-08-01
2025-11-14 17:28:09,230 - INFO - Finished converting document 4_2023-08-01 in 0.06 sec.
2025-11-14 17:28:09,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,283 - INFO - Going to convert document batch...
2025-11-14 17:28:09,284 - INFO - Processing document 4_2023-08-02
2025-11-14 17:28:09,314 - INFO - Finished converting document 4_2023-08-02 in 0.06 sec.
2025-11-14 17:28:09,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,384 - INFO - Going to convert document batch...
2025-11-14 17:28:09,385 - INFO - Processing document 4_2023-08-03
2025-11-14 17:28:09,412 - INFO - Finished converting document 4_2023-08-03 in 0.06 sec.


Converted 'data\edgar_documents\PG\4_2023-08-01' --> 'data\processed_data\PG\4_2023-08-01.md'
Converted 'data\edgar_documents\PG\4_2023-08-02' --> 'data\processed_data\PG\4_2023-08-02.md'
Converted 'data\edgar_documents\PG\4_2023-08-03' --> 'data\processed_data\PG\4_2023-08-03.md'


2025-11-14 17:28:09,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,473 - INFO - Going to convert document batch...
2025-11-14 17:28:09,474 - INFO - Processing document 4_2023-08-04
2025-11-14 17:28:09,491 - INFO - Finished converting document 4_2023-08-04 in 0.05 sec.
2025-11-14 17:28:09,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,540 - INFO - Going to convert document batch...
2025-11-14 17:28:09,541 - INFO - Processing document 4_2023-08-07
2025-11-14 17:28:09,572 - INFO - Finished converting document 4_2023-08-07 in 0.05 sec.
2025-11-14 17:28:09,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,640 - INFO - Going to convert document batch...
2025-11-14 17:28:09,641 - INFO - Processing document 4_2023-08-10
2025-11-14 17:28:09,670 - INFO - Finished converting document 4_2023-08-10 in 0.08 sec.
2025-11-14 17:28:09,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\4_2023-08-04' --> 'data\processed_data\PG\4_2023-08-04.md'
Converted 'data\edgar_documents\PG\4_2023-08-07' --> 'data\processed_data\PG\4_2023-08-07.md'
Converted 'data\edgar_documents\PG\4_2023-08-10' --> 'data\processed_data\PG\4_2023-08-10.md'


2025-11-14 17:28:09,716 - INFO - Going to convert document batch...
2025-11-14 17:28:09,717 - INFO - Processing document 4_2023-08-18
2025-11-14 17:28:09,738 - INFO - Finished converting document 4_2023-08-18 in 0.05 sec.
2025-11-14 17:28:09,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,811 - INFO - Going to convert document batch...
2025-11-14 17:28:09,812 - INFO - Processing document 4_2023-08-21
2025-11-14 17:28:09,839 - INFO - Finished converting document 4_2023-08-21 in 0.08 sec.
2025-11-14 17:28:09,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,878 - INFO - Going to convert document batch...
2025-11-14 17:28:09,879 - INFO - Processing document 4_2023-08-24
2025-11-14 17:28:09,900 - INFO - Finished converting document 4_2023-08-24 in 0.03 sec.
2025-11-14 17:28:09,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:09,939 - INFO - Going to convert document batch...
2025-11-14 17:28:09,940 - 

Converted 'data\edgar_documents\PG\4_2023-08-18' --> 'data\processed_data\PG\4_2023-08-18.md'
Converted 'data\edgar_documents\PG\4_2023-08-21' --> 'data\processed_data\PG\4_2023-08-21.md'
Converted 'data\edgar_documents\PG\4_2023-08-24' --> 'data\processed_data\PG\4_2023-08-24.md'


2025-11-14 17:28:09,959 - INFO - Finished converting document 4_2023-08-25 in 0.03 sec.
2025-11-14 17:28:09,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,000 - INFO - Going to convert document batch...
2025-11-14 17:28:10,001 - INFO - Processing document 4_2023-08-28
2025-11-14 17:28:10,020 - INFO - Finished converting document 4_2023-08-28 in 0.03 sec.
2025-11-14 17:28:10,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,063 - INFO - Going to convert document batch...
2025-11-14 17:28:10,064 - INFO - Processing document 4_2023-08-31
2025-11-14 17:28:10,085 - INFO - Finished converting document 4_2023-08-31 in 0.03 sec.
2025-11-14 17:28:10,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,124 - INFO - Going to convert document batch...
2025-11-14 17:28:10,124 - INFO - Processing document 4_2023-09-13
2025-11-14 17:28:10,141 - INFO - Finished converting document 4_2023-09-13 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\PG\4_2023-08-25' --> 'data\processed_data\PG\4_2023-08-25.md'
Converted 'data\edgar_documents\PG\4_2023-08-28' --> 'data\processed_data\PG\4_2023-08-28.md'
Converted 'data\edgar_documents\PG\4_2023-08-31' --> 'data\processed_data\PG\4_2023-08-31.md'
Converted 'data\edgar_documents\PG\4_2023-09-13' --> 'data\processed_data\PG\4_2023-09-13.md'


2025-11-14 17:28:10,183 - INFO - Going to convert document batch...
2025-11-14 17:28:10,184 - INFO - Processing document 4_2023-09-19
2025-11-14 17:28:10,205 - INFO - Finished converting document 4_2023-09-19 in 0.05 sec.
2025-11-14 17:28:10,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,264 - INFO - Going to convert document batch...
2025-11-14 17:28:10,265 - INFO - Processing document 4_2023-10-03
2025-11-14 17:28:10,296 - INFO - Finished converting document 4_2023-10-03 in 0.08 sec.
2025-11-14 17:28:10,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,336 - INFO - Going to convert document batch...
2025-11-14 17:28:10,337 - INFO - Processing document 4_2023-10-04
2025-11-14 17:28:10,357 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 17:28:10,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,401 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2023-09-19' --> 'data\processed_data\PG\4_2023-09-19.md'
Converted 'data\edgar_documents\PG\4_2023-10-03' --> 'data\processed_data\PG\4_2023-10-03.md'
Converted 'data\edgar_documents\PG\4_2023-10-04' --> 'data\processed_data\PG\4_2023-10-04.md'


2025-11-14 17:28:10,401 - INFO - Processing document 4_2023-10-11
2025-11-14 17:28:10,418 - INFO - Finished converting document 4_2023-10-11 in 0.05 sec.
2025-11-14 17:28:10,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,461 - INFO - Going to convert document batch...
2025-11-14 17:28:10,462 - INFO - Processing document 4_2023-10-23
2025-11-14 17:28:10,482 - INFO - Finished converting document 4_2023-10-23 in 0.05 sec.
2025-11-14 17:28:10,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,542 - INFO - Going to convert document batch...
2025-11-14 17:28:10,542 - INFO - Processing document 4_2023-10-25
2025-11-14 17:28:10,563 - INFO - Finished converting document 4_2023-10-25 in 0.06 sec.
2025-11-14 17:28:10,602 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:10,602 - ERROR - Input document 4_2023-10-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\PG\4_2023-10-11' --> 'data\processed_data\PG\4_2023-10-11.md'
Converted 'data\edgar_documents\PG\4_2023-10-23' --> 'data\processed_data\PG\4_2023-10-23.md'
Converted 'data\edgar_documents\PG\4_2023-10-25' --> 'data\processed_data\PG\4_2023-10-25.md'
Error processing data\edgar_documents\PG\4_2023-10-26: File format not allowed: data\edgar_documents\PG\4_2023-10-26


2025-11-14 17:28:10,623 - ERROR - Input document 4_2023-10-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:10,624 - INFO - Going to convert document batch...
2025-11-14 17:28:10,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,648 - INFO - Going to convert document batch...
2025-11-14 17:28:10,649 - INFO - Processing document 4_2023-11-07
2025-11-14 17:28:10,674 - INFO - Finished converting document 4_2023-11-07 in 0.05 sec.
2025-11-14 17:28:10,710 - INFO - detec

Error processing data\edgar_documents\PG\4_2023-10-30: File format not allowed: data\edgar_documents\PG\4_2023-10-30
Converted 'data\edgar_documents\PG\4_2023-11-07' --> 'data\processed_data\PG\4_2023-11-07.md'
Converted 'data\edgar_documents\PG\4_2023-11-14' --> 'data\processed_data\PG\4_2023-11-14.md'


2025-11-14 17:28:10,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,856 - INFO - Going to convert document batch...
2025-11-14 17:28:10,857 - INFO - Processing document 4_2023-12-04
2025-11-14 17:28:10,886 - INFO - Finished converting document 4_2023-12-04 in 0.06 sec.
2025-11-14 17:28:10,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:10,958 - INFO - Going to convert document batch...
2025-11-14 17:28:10,958 - INFO - Processing document 4_2023-12-08
2025-11-14 17:28:10,984 - INFO - Finished converting document 4_2023-12-08 in 0.06 sec.
2025-11-14 17:28:11,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\4_2023-11-16' --> 'data\processed_data\PG\4_2023-11-16.md'
Converted 'data\edgar_documents\PG\4_2023-12-04' --> 'data\processed_data\PG\4_2023-12-04.md'
Converted 'data\edgar_documents\PG\4_2023-12-08' --> 'data\processed_data\PG\4_2023-12-08.md'


2025-11-14 17:28:11,028 - INFO - Going to convert document batch...
2025-11-14 17:28:11,029 - INFO - Processing document 4_2023-12-13
2025-11-14 17:28:11,047 - INFO - Finished converting document 4_2023-12-13 in 0.05 sec.
2025-11-14 17:28:11,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,091 - INFO - Going to convert document batch...
2025-11-14 17:28:11,093 - INFO - Processing document 4_2023-12-14
2025-11-14 17:28:11,110 - INFO - Finished converting document 4_2023-12-14 in 0.05 sec.
2025-11-14 17:28:11,173 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:11,174 - ERROR - Input document 4_2024-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\PG\4_2023-12-13' --> 'data\processed_data\PG\4_2023-12-13.md'
Converted 'data\edgar_documents\PG\4_2023-12-14' --> 'data\processed_data\PG\4_2023-12-14.md'
Error processing data\edgar_documents\PG\4_2024-01-24: File format not allowed: data\edgar_documents\PG\4_2024-01-24
Error processing data\edgar_documents\PG\4_2024-01-25: File format not allowed: data\edgar_documents\PG\4_2024-01-25


2025-11-14 17:28:11,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,299 - INFO - Going to convert document batch...
2025-11-14 17:28:11,300 - INFO - Processing document 4_2024-01-30
2025-11-14 17:28:11,325 - INFO - Finished converting document 4_2024-01-30 in 0.06 sec.
2025-11-14 17:28:11,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,409 - INFO - Going to convert document batch...
2025-11-14 17:28:11,409 - INFO - Processing document 4_2024-02-07
2025-11-14 17:28:11,431 - INFO - Finished converting document 4_2024-02-07 in 0.06 sec.


Converted 'data\edgar_documents\PG\4_2024-01-26' --> 'data\processed_data\PG\4_2024-01-26.md'
Converted 'data\edgar_documents\PG\4_2024-01-30' --> 'data\processed_data\PG\4_2024-01-30.md'


2025-11-14 17:28:11,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,476 - INFO - Going to convert document batch...
2025-11-14 17:28:11,477 - INFO - Processing document 4_2024-02-22
2025-11-14 17:28:11,507 - INFO - Finished converting document 4_2024-02-22 in 0.05 sec.
2025-11-14 17:28:11,543 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,553 - INFO - Going to convert document batch...
2025-11-14 17:28:11,554 - INFO - Processing document 4_2024-02-26
2025-11-14 17:28:11,578 - INFO - Finished converting document 4_2024-02-26 in 0.05 sec.
2025-11-14 17:28:11,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,646 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2024-02-07' --> 'data\processed_data\PG\4_2024-02-07.md'
Converted 'data\edgar_documents\PG\4_2024-02-22' --> 'data\processed_data\PG\4_2024-02-22.md'
Converted 'data\edgar_documents\PG\4_2024-02-26' --> 'data\processed_data\PG\4_2024-02-26.md'


2025-11-14 17:28:11,647 - INFO - Processing document 4_2024-03-05
2025-11-14 17:28:11,678 - INFO - Finished converting document 4_2024-03-05 in 0.08 sec.
2025-11-14 17:28:11,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,723 - INFO - Going to convert document batch...
2025-11-14 17:28:11,724 - INFO - Processing document 4_2024-03-13
2025-11-14 17:28:11,742 - INFO - Finished converting document 4_2024-03-13 in 0.03 sec.
2025-11-14 17:28:11,780 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:11,781 - ERROR - Input document 4_2024-04-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\PG\4_2024-03-05' --> 'data\processed_data\PG\4_2024-03-05.md'
Converted 'data\edgar_documents\PG\4_2024-03-13' --> 'data\processed_data\PG\4_2024-03-13.md'
Error processing data\edgar_documents\PG\4_2024-04-22: File format not allowed: data\edgar_documents\PG\4_2024-04-22
Converted 'data\edgar_documents\PG\4_2024-04-23' --> 'data\processed_data\PG\4_2024-04-23.md'


2025-11-14 17:28:11,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:11,941 - INFO - Going to convert document batch...
2025-11-14 17:28:11,942 - INFO - Processing document 4_2024-05-01
2025-11-14 17:28:11,969 - INFO - Finished converting document 4_2024-05-01 in 0.05 sec.
2025-11-14 17:28:12,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,041 - INFO - Going to convert document batch...
2025-11-14 17:28:12,042 - INFO - Processing document 4_2024-05-07
2025-11-14 17:28:12,067 - INFO - Finished converting document 4_2024-05-07 in 0.06 sec.
2025-11-14 17:28:12,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,110 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2024-04-24' --> 'data\processed_data\PG\4_2024-04-24.md'
Converted 'data\edgar_documents\PG\4_2024-05-01' --> 'data\processed_data\PG\4_2024-05-01.md'
Converted 'data\edgar_documents\PG\4_2024-05-07' --> 'data\processed_data\PG\4_2024-05-07.md'


2025-11-14 17:28:12,111 - INFO - Processing document 4_2024-05-08
2025-11-14 17:28:12,134 - INFO - Finished converting document 4_2024-05-08 in 0.03 sec.
2025-11-14 17:28:12,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,180 - INFO - Going to convert document batch...
2025-11-14 17:28:12,181 - INFO - Processing document 4_2024-05-10
2025-11-14 17:28:12,206 - INFO - Finished converting document 4_2024-05-10 in 0.05 sec.
2025-11-14 17:28:12,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,247 - INFO - Going to convert document batch...
2025-11-14 17:28:12,248 - INFO - Processing document 4_2024-05-16
2025-11-14 17:28:12,267 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 17:28:12,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,309 - INFO - Going to convert document batch...
2025-11-14 17:28:12,310 - INFO - Processing document 4_2024-05-17
2025-11-14 17:28:12,333 - IN

Converted 'data\edgar_documents\PG\4_2024-05-08' --> 'data\processed_data\PG\4_2024-05-08.md'
Converted 'data\edgar_documents\PG\4_2024-05-10' --> 'data\processed_data\PG\4_2024-05-10.md'
Converted 'data\edgar_documents\PG\4_2024-05-16' --> 'data\processed_data\PG\4_2024-05-16.md'
Converted 'data\edgar_documents\PG\4_2024-05-17' --> 'data\processed_data\PG\4_2024-05-17.md'


2025-11-14 17:28:12,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,380 - INFO - Going to convert document batch...
2025-11-14 17:28:12,381 - INFO - Processing document 4_2024-05-21
2025-11-14 17:28:12,408 - INFO - Finished converting document 4_2024-05-21 in 0.05 sec.
2025-11-14 17:28:12,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,838 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2024-05-21' --> 'data\processed_data\PG\4_2024-05-21.md'


2025-11-14 17:28:12,840 - INFO - Processing document 4_2024-06-12
2025-11-14 17:28:12,860 - INFO - Finished converting document 4_2024-06-12 in 0.42 sec.
2025-11-14 17:28:12,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:12,906 - INFO - Going to convert document batch...
2025-11-14 17:28:12,907 - INFO - Processing document 4_2024-08-05
2025-11-14 17:28:12,936 - INFO - Finished converting document 4_2024-08-05 in 0.06 sec.
2025-11-14 17:28:12,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,008 - INFO - Going to convert document batch...
2025-11-14 17:28:13,009 - INFO - Processing document 4_2024-08-06
2025-11-14 17:28:13,030 - INFO - Finished converting document 4_2024-08-06 in 0.08 sec.
2025-11-14 17:28:13,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\4_2024-06-12' --> 'data\processed_data\PG\4_2024-06-12.md'
Converted 'data\edgar_documents\PG\4_2024-08-05' --> 'data\processed_data\PG\4_2024-08-05.md'
Converted 'data\edgar_documents\PG\4_2024-08-06' --> 'data\processed_data\PG\4_2024-08-06.md'


2025-11-14 17:28:13,073 - INFO - Going to convert document batch...
2025-11-14 17:28:13,074 - INFO - Processing document 4_2024-08-12
2025-11-14 17:28:13,096 - INFO - Finished converting document 4_2024-08-12 in 0.05 sec.
2025-11-14 17:28:13,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,140 - INFO - Going to convert document batch...
2025-11-14 17:28:13,141 - INFO - Processing document 4_2024-08-20
2025-11-14 17:28:13,161 - INFO - Finished converting document 4_2024-08-20 in 0.05 sec.
2025-11-14 17:28:13,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,226 - INFO - Going to convert document batch...
2025-11-14 17:28:13,227 - INFO - Processing document 4_2024-08-22
2025-11-14 17:28:13,247 - INFO - Finished converting document 4_2024-08-22 in 0.06 sec.
2025-11-14 17:28:13,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,290 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2024-08-12' --> 'data\processed_data\PG\4_2024-08-12.md'
Converted 'data\edgar_documents\PG\4_2024-08-20' --> 'data\processed_data\PG\4_2024-08-20.md'
Converted 'data\edgar_documents\PG\4_2024-08-22' --> 'data\processed_data\PG\4_2024-08-22.md'


2025-11-14 17:28:13,291 - INFO - Processing document 4_2024-08-23
2025-11-14 17:28:13,311 - INFO - Finished converting document 4_2024-08-23 in 0.05 sec.
2025-11-14 17:28:13,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,381 - INFO - Going to convert document batch...
2025-11-14 17:28:13,382 - INFO - Processing document 4_2024-08-26
2025-11-14 17:28:13,405 - INFO - Finished converting document 4_2024-08-26 in 0.06 sec.
2025-11-14 17:28:13,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,447 - INFO - Going to convert document batch...
2025-11-14 17:28:13,448 - INFO - Processing document 4_2024-08-27
2025-11-14 17:28:13,469 - INFO - Finished converting document 4_2024-08-27 in 0.05 sec.
2025-11-14 17:28:13,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,525 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2024-08-23' --> 'data\processed_data\PG\4_2024-08-23.md'
Converted 'data\edgar_documents\PG\4_2024-08-26' --> 'data\processed_data\PG\4_2024-08-26.md'
Converted 'data\edgar_documents\PG\4_2024-08-27' --> 'data\processed_data\PG\4_2024-08-27.md'


2025-11-14 17:28:13,526 - INFO - Processing document 4_2024-08-29
2025-11-14 17:28:13,547 - INFO - Finished converting document 4_2024-08-29 in 0.06 sec.
2025-11-14 17:28:13,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,590 - INFO - Going to convert document batch...
2025-11-14 17:28:13,591 - INFO - Processing document 4_2024-09-11
2025-11-14 17:28:13,609 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.
2025-11-14 17:28:13,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,663 - INFO - Going to convert document batch...
2025-11-14 17:28:13,664 - INFO - Processing document 4_2024-09-16
2025-11-14 17:28:13,701 - INFO - Finished converting document 4_2024-09-16 in 0.08 sec.
2025-11-14 17:28:13,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,742 - INFO - Going to convert document batch...
2025-11-14 17:28:13,743 - INFO - Processing document 4_2024-10-03
2025-11-14 17:28:13,765 - IN

Converted 'data\edgar_documents\PG\4_2024-08-29' --> 'data\processed_data\PG\4_2024-08-29.md'
Converted 'data\edgar_documents\PG\4_2024-09-11' --> 'data\processed_data\PG\4_2024-09-11.md'
Converted 'data\edgar_documents\PG\4_2024-09-16' --> 'data\processed_data\PG\4_2024-09-16.md'


2025-11-14 17:28:13,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,810 - INFO - Going to convert document batch...
2025-11-14 17:28:13,810 - INFO - Processing document 4_2024-10-04
2025-11-14 17:28:13,835 - INFO - Finished converting document 4_2024-10-04 in 0.05 sec.
2025-11-14 17:28:13,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,892 - INFO - Going to convert document batch...
2025-11-14 17:28:13,892 - INFO - Processing document 4_2024-10-09
2025-11-14 17:28:13,911 - INFO - Finished converting document 4_2024-10-09 in 0.05 sec.
2025-11-14 17:28:13,952 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:13,952 - ERROR - Input document 4_2024-10-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\PG\4_2024-10-03' --> 'data\processed_data\PG\4_2024-10-03.md'
Converted 'data\edgar_documents\PG\4_2024-10-04' --> 'data\processed_data\PG\4_2024-10-04.md'
Converted 'data\edgar_documents\PG\4_2024-10-09' --> 'data\processed_data\PG\4_2024-10-09.md'
Error processing data\edgar_documents\PG\4_2024-10-21: File format not allowed: data\edgar_documents\PG\4_2024-10-21


2025-11-14 17:28:13,974 - ERROR - Input document 4_2024-10-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:13,975 - INFO - Going to convert document batch...
2025-11-14 17:28:13,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:13,995 - INFO - Going to convert document batch...
2025-11-14 17:28:13,996 - INFO - Processing document 4_2024-10-23
2025-11-14 17:28:14,019 - INFO - Finished converting document 4_2024-10-23 in 0.05 sec.
2025-11-14 17:28:14,052 - INFO - detec

Error processing data\edgar_documents\PG\4_2024-10-22: File format not allowed: data\edgar_documents\PG\4_2024-10-22
Converted 'data\edgar_documents\PG\4_2024-10-23' --> 'data\processed_data\PG\4_2024-10-23.md'
Converted 'data\edgar_documents\PG\4_2024-10-24' --> 'data\processed_data\PG\4_2024-10-24.md'


2025-11-14 17:28:14,156 - INFO - Processing document 4_2024-10-25
2025-11-14 17:28:14,177 - INFO - Finished converting document 4_2024-10-25 in 0.03 sec.
2025-11-14 17:28:14,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,224 - INFO - Going to convert document batch...
2025-11-14 17:28:14,225 - INFO - Processing document 4_2024-11-25
2025-11-14 17:28:14,250 - INFO - Finished converting document 4_2024-11-25 in 0.05 sec.
2025-11-14 17:28:14,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,293 - INFO - Going to convert document batch...
2025-11-14 17:28:14,294 - INFO - Processing document 4_2024-12-02
2025-11-14 17:28:14,318 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 17:28:14,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,360 - INFO - Going to convert document batch...
2025-11-14 17:28:14,362 - INFO - Processing document 4_2024-12-11
2025-11-14 17:28:14,380 - IN

Converted 'data\edgar_documents\PG\4_2024-10-25' --> 'data\processed_data\PG\4_2024-10-25.md'
Converted 'data\edgar_documents\PG\4_2024-11-25' --> 'data\processed_data\PG\4_2024-11-25.md'
Converted 'data\edgar_documents\PG\4_2024-12-02' --> 'data\processed_data\PG\4_2024-12-02.md'


2025-11-14 17:28:14,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,425 - INFO - Going to convert document batch...
2025-11-14 17:28:14,426 - INFO - Processing document 4_2024-12-20
2025-11-14 17:28:14,456 - INFO - Finished converting document 4_2024-12-20 in 0.05 sec.
2025-11-14 17:28:14,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,510 - INFO - Going to convert document batch...
2025-11-14 17:28:14,510 - INFO - Processing document 4_2025-01-27
2025-11-14 17:28:14,534 - INFO - Finished converting document 4_2025-01-27 in 0.05 sec.


Converted 'data\edgar_documents\PG\4_2024-12-11' --> 'data\processed_data\PG\4_2024-12-11.md'
Converted 'data\edgar_documents\PG\4_2024-12-20' --> 'data\processed_data\PG\4_2024-12-20.md'
Converted 'data\edgar_documents\PG\4_2025-01-27' --> 'data\processed_data\PG\4_2025-01-27.md'


2025-11-14 17:28:14,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,597 - INFO - Going to convert document batch...
2025-11-14 17:28:14,598 - INFO - Processing document 4_2025-02-06
2025-11-14 17:28:14,616 - INFO - Finished converting document 4_2025-02-06 in 0.05 sec.
2025-11-14 17:28:14,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,677 - INFO - Going to convert document batch...
2025-11-14 17:28:14,679 - INFO - Processing document 4_2025-02-25
2025-11-14 17:28:14,704 - INFO - Finished converting document 4_2025-02-25 in 0.05 sec.
2025-11-14 17:28:14,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:14,748 - INFO - Going to convert document batch...
2025-11-14 17:28:14,749 - INFO - Processing document 4_2025-03-03
2025-11-14 17:28:14,770 - INFO - Finished converting document 4_2025-03-03 in 0.05 sec.
2025-11-14 17:28:14,806 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\PG\4_2025-02-06' --> 'data\processed_data\PG\4_2025-02-06.md'
Converted 'data\edgar_documents\PG\4_2025-02-25' --> 'data\processed_data\PG\4_2025-02-25.md'
Converted 'data\edgar_documents\PG\4_2025-03-03' --> 'data\processed_data\PG\4_2025-03-03.md'


2025-11-14 17:28:14,871 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:14,872 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:14,873 - INFO - Going to convert document batch...
2025-11-14 17:28:14,893 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:14,893 - ERROR - Input document 4_2025-04-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\PG\4_2025-03-12' --> 'data\processed_data\PG\4_2025-03-12.md'
Error processing data\edgar_documents\PG\4_2025-04-28: File format not allowed: data\edgar_documents\PG\4_2025-04-28
Error processing data\edgar_documents\PG\4_2025-04-29: File format not allowed: data\edgar_documents\PG\4_2025-04-29
Converted 'data\edgar_documents\PG\4_2025-04-30' --> 'data\processed_data\PG\4_2025-04-30.md'


2025-11-14 17:28:15,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,064 - INFO - Going to convert document batch...
2025-11-14 17:28:15,064 - INFO - Processing document 4_2025-06-11
2025-11-14 17:28:15,085 - INFO - Finished converting document 4_2025-06-11 in 0.03 sec.
2025-11-14 17:28:15,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,130 - INFO - Going to convert document batch...
2025-11-14 17:28:15,131 - INFO - Processing document 4_2025-08-07
2025-11-14 17:28:15,162 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.
2025-11-14 17:28:15,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,234 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2025-05-06' --> 'data\processed_data\PG\4_2025-05-06.md'
Converted 'data\edgar_documents\PG\4_2025-06-11' --> 'data\processed_data\PG\4_2025-06-11.md'
Converted 'data\edgar_documents\PG\4_2025-08-07' --> 'data\processed_data\PG\4_2025-08-07.md'


2025-11-14 17:28:15,234 - INFO - Processing document 4_2025-08-20
2025-11-14 17:28:15,257 - INFO - Finished converting document 4_2025-08-20 in 0.06 sec.
2025-11-14 17:28:15,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,301 - INFO - Going to convert document batch...
2025-11-14 17:28:15,301 - INFO - Processing document 4_2025-08-21
2025-11-14 17:28:15,322 - INFO - Finished converting document 4_2025-08-21 in 0.03 sec.
2025-11-14 17:28:15,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,390 - INFO - Going to convert document batch...
2025-11-14 17:28:15,391 - INFO - Processing document 4_2025-08-22
2025-11-14 17:28:15,409 - INFO - Finished converting document 4_2025-08-22 in 0.05 sec.
2025-11-14 17:28:15,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,476 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PG\4_2025-08-20' --> 'data\processed_data\PG\4_2025-08-20.md'
Converted 'data\edgar_documents\PG\4_2025-08-21' --> 'data\processed_data\PG\4_2025-08-21.md'
Converted 'data\edgar_documents\PG\4_2025-08-22' --> 'data\processed_data\PG\4_2025-08-22.md'


2025-11-14 17:28:15,478 - INFO - Processing document 4_2025-08-27
2025-11-14 17:28:15,507 - INFO - Finished converting document 4_2025-08-27 in 0.08 sec.
2025-11-14 17:28:15,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,551 - INFO - Going to convert document batch...
2025-11-14 17:28:15,552 - INFO - Processing document 4_2025-08-29
2025-11-14 17:28:15,571 - INFO - Finished converting document 4_2025-08-29 in 0.03 sec.
2025-11-14 17:28:15,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,608 - INFO - Going to convert document batch...
2025-11-14 17:28:15,609 - INFO - Processing document 4_2025-09-10
2025-11-14 17:28:15,627 - INFO - Finished converting document 4_2025-09-10 in 0.03 sec.
2025-11-14 17:28:15,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,666 - INFO - Going to convert document batch...
2025-11-14 17:28:15,667 - INFO - Processing document 4_2025-09-17
2025-11-14 17:28:15,686 - IN

Converted 'data\edgar_documents\PG\4_2025-08-27' --> 'data\processed_data\PG\4_2025-08-27.md'
Converted 'data\edgar_documents\PG\4_2025-08-29' --> 'data\processed_data\PG\4_2025-08-29.md'
Converted 'data\edgar_documents\PG\4_2025-09-10' --> 'data\processed_data\PG\4_2025-09-10.md'
Converted 'data\edgar_documents\PG\4_2025-09-17' --> 'data\processed_data\PG\4_2025-09-17.md'


2025-11-14 17:28:15,747 - INFO - Going to convert document batch...
2025-11-14 17:28:15,748 - INFO - Processing document 4_2025-10-02
2025-11-14 17:28:15,766 - INFO - Finished converting document 4_2025-10-02 in 0.06 sec.
2025-11-14 17:28:15,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,811 - INFO - Going to convert document batch...
2025-11-14 17:28:15,812 - INFO - Processing document 4_2025-10-06
2025-11-14 17:28:15,830 - INFO - Finished converting document 4_2025-10-06 in 0.03 sec.
2025-11-14 17:28:15,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:15,891 - INFO - Going to convert document batch...
2025-11-14 17:28:15,892 - INFO - Processing document 4_2025-10-15
2025-11-14 17:28:15,908 - INFO - Finished converting document 4_2025-10-15 in 0.06 sec.
2025-11-14 17:28:15,973 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:15,975 - ERROR - Input document 4_2025-10-27 with format None does 

Converted 'data\edgar_documents\PG\4_2025-10-02' --> 'data\processed_data\PG\4_2025-10-02.md'
Converted 'data\edgar_documents\PG\4_2025-10-06' --> 'data\processed_data\PG\4_2025-10-06.md'
Converted 'data\edgar_documents\PG\4_2025-10-15' --> 'data\processed_data\PG\4_2025-10-15.md'
Error processing data\edgar_documents\PG\4_2025-10-27: File format not allowed: data\edgar_documents\PG\4_2025-10-27


2025-11-14 17:28:16,006 - ERROR - Input document 4_2025-10-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:16,010 - INFO - Going to convert document batch...
2025-11-14 17:28:16,059 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:16,060 - ERROR - Input document 4_2025-10-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\PG\4_2025-10-28: File format not allowed: data\edgar_documents\PG\4_2025-10-28
Error processing data\edgar_documents\PG\4_2025-10-29: File format not allowed: data\edgar_documents\PG\4_2025-10-29
Error processing data\edgar_documents\PG\4_2025-10-30: File format not allowed: data\edgar_documents\PG\4_2025-10-30
Converted 'data\edgar_documents\PG\4_2025-11-07' --> 'data\processed_data\PG\4_2025-11-07.md'


2025-11-14 17:28:16,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:16,276 - INFO - Going to convert document batch...
2025-11-14 17:28:16,277 - INFO - Processing document 8-K_2023-01-19
2025-11-14 17:28:16,308 - INFO - Finished converting document 8-K_2023-01-19 in 0.08 sec.
2025-11-14 17:28:16,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:16,353 - INFO - Going to convert document batch...
2025-11-14 17:28:16,354 - INFO - Processing document 8-K_2023-01-26
2025-11-14 17:28:16,386 - INFO - Finished converting document 8-K_2023-01-26 in 0.08 sec.
2025-11-14 17:28:16,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\8-K_2023-01-10' --> 'data\processed_data\PG\8-K_2023-01-10.md'
Converted 'data\edgar_documents\PG\8-K_2023-01-19' --> 'data\processed_data\PG\8-K_2023-01-19.md'
Converted 'data\edgar_documents\PG\8-K_2023-01-26' --> 'data\processed_data\PG\8-K_2023-01-26.md'


2025-11-14 17:28:16,445 - INFO - Going to convert document batch...
2025-11-14 17:28:16,446 - INFO - Processing document 8-K_2023-02-03
2025-11-14 17:28:16,473 - INFO - Finished converting document 8-K_2023-02-03 in 0.06 sec.
2025-11-14 17:28:16,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:16,529 - INFO - Going to convert document batch...
2025-11-14 17:28:16,530 - INFO - Processing document 8-K_2023-04-11
2025-11-14 17:28:16,571 - INFO - Finished converting document 8-K_2023-04-11 in 0.08 sec.
2025-11-14 17:28:16,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:16,621 - INFO - Going to convert document batch...
2025-11-14 17:28:16,622 - INFO - Processing document 8-K_2023-04-21
2025-11-14 17:28:16,654 - INFO - Finished converting document 8-K_2023-04-21 in 0.08 sec.
2025-11-14 17:28:16,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\8-K_2023-02-03' --> 'data\processed_data\PG\8-K_2023-02-03.md'
Converted 'data\edgar_documents\PG\8-K_2023-04-11' --> 'data\processed_data\PG\8-K_2023-04-11.md'
Converted 'data\edgar_documents\PG\8-K_2023-04-21' --> 'data\processed_data\PG\8-K_2023-04-21.md'


2025-11-14 17:28:16,920 - INFO - Going to convert document batch...
2025-11-14 17:28:16,921 - INFO - Processing document 8-K_2023-05-02
2025-11-14 17:28:16,947 - INFO - Finished converting document 8-K_2023-05-02 in 0.28 sec.
2025-11-14 17:28:16,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,004 - INFO - Going to convert document batch...
2025-11-14 17:28:17,005 - INFO - Processing document 8-K_2023-07-11
2025-11-14 17:28:17,036 - INFO - Finished converting document 8-K_2023-07-11 in 0.08 sec.
2025-11-14 17:28:17,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,111 - INFO - Going to convert document batch...
2025-11-14 17:28:17,112 - INFO - Processing document 8-K_2023-07-28
2025-11-14 17:28:17,140 - INFO - Finished converting document 8-K_2023-07-28 in 0.09 sec.


Converted 'data\edgar_documents\PG\8-K_2023-05-02' --> 'data\processed_data\PG\8-K_2023-05-02.md'
Converted 'data\edgar_documents\PG\8-K_2023-07-11' --> 'data\processed_data\PG\8-K_2023-07-11.md'


2025-11-14 17:28:17,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,189 - INFO - Going to convert document batch...
2025-11-14 17:28:17,190 - INFO - Processing document 8-K_2023-10-10
2025-11-14 17:28:17,224 - INFO - Finished converting document 8-K_2023-10-10 in 0.06 sec.
2025-11-14 17:28:17,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,324 - INFO - Going to convert document batch...
2025-11-14 17:28:17,325 - INFO - Processing document 8-K_2023-10-13


Converted 'data\edgar_documents\PG\8-K_2023-07-28' --> 'data\processed_data\PG\8-K_2023-07-28.md'
Converted 'data\edgar_documents\PG\8-K_2023-10-10' --> 'data\processed_data\PG\8-K_2023-10-10.md'


2025-11-14 17:28:17,364 - INFO - Finished converting document 8-K_2023-10-13 in 0.12 sec.
2025-11-14 17:28:17,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,440 - INFO - Going to convert document batch...
2025-11-14 17:28:17,442 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:28:17,485 - INFO - Finished converting document 8-K_2023-10-18 in 0.11 sec.
2025-11-14 17:28:17,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,529 - INFO - Going to convert document batch...
2025-11-14 17:28:17,529 - INFO - Processing document 8-K_2023-11-01
2025-11-14 17:28:17,556 - INFO - Finished converting document 8-K_2023-11-01 in 0.05 sec.


Converted 'data\edgar_documents\PG\8-K_2023-10-13' --> 'data\processed_data\PG\8-K_2023-10-13.md'
Converted 'data\edgar_documents\PG\8-K_2023-10-18' --> 'data\processed_data\PG\8-K_2023-10-18.md'


2025-11-14 17:28:17,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,604 - INFO - Going to convert document batch...
2025-11-14 17:28:17,605 - INFO - Processing document 8-K_2023-12-05
2025-11-14 17:28:17,638 - INFO - Finished converting document 8-K_2023-12-05 in 0.08 sec.
2025-11-14 17:28:17,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,701 - INFO - Going to convert document batch...
2025-11-14 17:28:17,702 - INFO - Processing document 8-K_2023-12-13
2025-11-14 17:28:17,737 - INFO - Finished converting document 8-K_2023-12-13 in 0.08 sec.


Converted 'data\edgar_documents\PG\8-K_2023-11-01' --> 'data\processed_data\PG\8-K_2023-11-01.md'
Converted 'data\edgar_documents\PG\8-K_2023-12-05' --> 'data\processed_data\PG\8-K_2023-12-05.md'


2025-11-14 17:28:17,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,789 - INFO - Going to convert document batch...
2025-11-14 17:28:17,790 - INFO - Processing document 8-K_2024-01-09
2025-11-14 17:28:17,824 - INFO - Finished converting document 8-K_2024-01-09 in 0.08 sec.
2025-11-14 17:28:17,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:17,906 - INFO - Going to convert document batch...
2025-11-14 17:28:17,907 - INFO - Processing document 8-K_2024-01-23


Converted 'data\edgar_documents\PG\8-K_2023-12-13' --> 'data\processed_data\PG\8-K_2023-12-13.md'
Converted 'data\edgar_documents\PG\8-K_2024-01-09' --> 'data\processed_data\PG\8-K_2024-01-09.md'


2025-11-14 17:28:17,948 - INFO - Finished converting document 8-K_2024-01-23 in 0.12 sec.
2025-11-14 17:28:17,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:18,005 - INFO - Going to convert document batch...
2025-11-14 17:28:18,006 - INFO - Processing document 8-K_2024-01-29
2025-11-14 17:28:18,037 - INFO - Finished converting document 8-K_2024-01-29 in 0.06 sec.
2025-11-14 17:28:18,087 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,088 - ERROR - Input document 8-K_2024-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS:

Converted 'data\edgar_documents\PG\8-K_2024-01-23' --> 'data\processed_data\PG\8-K_2024-01-23.md'
Converted 'data\edgar_documents\PG\8-K_2024-01-29' --> 'data\processed_data\PG\8-K_2024-01-29.md'
Error processing data\edgar_documents\PG\8-K_2024-04-09: File format not allowed: data\edgar_documents\PG\8-K_2024-04-09
Error processing data\edgar_documents\PG\8-K_2024-04-19: File format not allowed: data\edgar_documents\PG\8-K_2024-04-19


2025-11-14 17:28:18,195 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,196 - ERROR - Input document 8-K_2024-07-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:18,197 - INFO - Going to convert document batch...
2025-11-14 17:28:18,213 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,214 - ERROR - Input document 8-K_2024-07-30 with format None does 

Converted 'data\edgar_documents\PG\8-K_2024-04-29' --> 'data\processed_data\PG\8-K_2024-04-29.md'
Error processing data\edgar_documents\PG\8-K_2024-07-09: File format not allowed: data\edgar_documents\PG\8-K_2024-07-09
Error processing data\edgar_documents\PG\8-K_2024-07-30: File format not allowed: data\edgar_documents\PG\8-K_2024-07-30
Error processing data\edgar_documents\PG\8-K_2024-10-08: File format not allowed: data\edgar_documents\PG\8-K_2024-10-08
Error processing data\edgar_documents\PG\8-K_2024-10-10: File format not allowed: data\edgar_documents\PG\8-K_2024-10-10
Error processing data\edgar_documents\PG\8-K_2024-10-18: File format not allowed: data\edgar_documents\PG\8-K_2024-10-18


2025-11-14 17:28:18,397 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,398 - ERROR - Input document 8-K_2025-01-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:18,399 - INFO - Going to convert document batch...
2025-11-14 17:28:18,414 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,414 - ERROR - Input document 8-K_2025-01-22 with format None does 

Converted 'data\edgar_documents\PG\8-K_2024-10-24' --> 'data\processed_data\PG\8-K_2024-10-24.md'
Error processing data\edgar_documents\PG\8-K_2025-01-14: File format not allowed: data\edgar_documents\PG\8-K_2025-01-14
Error processing data\edgar_documents\PG\8-K_2025-01-22: File format not allowed: data\edgar_documents\PG\8-K_2025-01-22
Error processing data\edgar_documents\PG\8-K_2025-04-08: File format not allowed: data\edgar_documents\PG\8-K_2025-04-08
Error processing data\edgar_documents\PG\8-K_2025-04-24: File format not allowed: data\edgar_documents\PG\8-K_2025-04-24
Converted 'data\edgar_documents\PG\8-K_2025-05-01' --> 'data\processed_data\PG\8-K_2025-05-01.md'


2025-11-14 17:28:18,571 - ERROR - Input document 8-K_2025-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:28:18,572 - INFO - Going to convert document batch...
2025-11-14 17:28:18,589 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:18,590 - ERROR - Input document 8-K_2025-06-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, 

Error processing data\edgar_documents\PG\8-K_2025-06-05: File format not allowed: data\edgar_documents\PG\8-K_2025-06-05
Error processing data\edgar_documents\PG\8-K_2025-06-09: File format not allowed: data\edgar_documents\PG\8-K_2025-06-09
Error processing data\edgar_documents\PG\8-K_2025-07-08: File format not allowed: data\edgar_documents\PG\8-K_2025-07-08
Error processing data\edgar_documents\PG\8-K_2025-07-28: File format not allowed: data\edgar_documents\PG\8-K_2025-07-28
Converted 'data\edgar_documents\PG\8-K_2025-07-29' --> 'data\processed_data\PG\8-K_2025-07-29.md'
Converted 'data\edgar_documents\PG\8-K_2025-08-14' --> 'data\processed_data\PG\8-K_2025-08-14.md'


2025-11-14 17:28:18,772 - INFO - Processing document 8-K_2025-10-14
2025-11-14 17:28:18,793 - INFO - Finished converting document 8-K_2025-10-14 in 0.06 sec.
2025-11-14 17:28:18,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:18,848 - INFO - Going to convert document batch...
2025-11-14 17:28:18,848 - INFO - Processing document 8-K_2025-10-16
2025-11-14 17:28:18,884 - INFO - Finished converting document 8-K_2025-10-16 in 0.08 sec.
2025-11-14 17:28:18,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:18,930 - INFO - Going to convert document batch...
2025-11-14 17:28:18,931 - INFO - Processing document 8-K_2025-10-24
2025-11-14 17:28:18,953 - INFO - Finished converting document 8-K_2025-10-24 in 0.05 sec.
2025-11-14 17:28:18,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\8-K_2025-10-14' --> 'data\processed_data\PG\8-K_2025-10-14.md'
Converted 'data\edgar_documents\PG\8-K_2025-10-16' --> 'data\processed_data\PG\8-K_2025-10-16.md'
Converted 'data\edgar_documents\PG\8-K_2025-10-24' --> 'data\processed_data\PG\8-K_2025-10-24.md'


2025-11-14 17:28:18,994 - INFO - Going to convert document batch...
2025-11-14 17:28:18,995 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:28:19,024 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 17:28:19,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:19,088 - INFO - Going to convert document batch...
2025-11-14 17:28:19,089 - INFO - Processing document 8-K_2025-11-04
2025-11-14 17:28:19,127 - INFO - Finished converting document 8-K_2025-11-04 in 0.09 sec.
2025-11-14 17:28:19,178 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:28:19,179 - ERROR - Input document DEF-14A_2023-08-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\PG\8-K_2025-11-03' --> 'data\processed_data\PG\8-K_2025-11-03.md'
Converted 'data\edgar_documents\PG\8-K_2025-11-04' --> 'data\processed_data\PG\8-K_2025-11-04.md'
Error processing data\edgar_documents\PG\DEF-14A_2023-08-25: File format not allowed: data\edgar_documents\PG\DEF-14A_2023-08-25


2025-11-14 17:28:19,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:20,267 - INFO - Going to convert document batch...
2025-11-14 17:28:20,268 - INFO - Processing document DEF-14A_2024-08-23
2025-11-14 17:28:22,107 - INFO - Finished converting document DEF-14A_2024-08-23 in 2.92 sec.
2025-11-14 17:28:23,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\DEF-14A_2024-08-23' --> 'data\processed_data\PG\DEF-14A_2024-08-23.md'


2025-11-14 17:28:24,207 - INFO - Going to convert document batch...
2025-11-14 17:28:24,208 - INFO - Processing document DEF-14A_2025-08-29
2025-11-14 17:28:25,823 - INFO - Finished converting document DEF-14A_2025-08-29 in 2.89 sec.
2025-11-14 17:28:26,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PG\DEF-14A_2025-08-29' --> 'data\processed_data\PG\DEF-14A_2025-08-29.md'
Processed 135 new files. Errors: 34
Found 201 files to process in data\edgar_documents\PLTR


2025-11-14 17:28:27,194 - INFO - Going to convert document batch...
2025-11-14 17:28:27,195 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:28:27,196 - INFO - Processing document 10-K_2023-02-21
2025-11-14 17:28:28,603 - INFO - Finished converting document 10-K_2023-02-21 in 1.84 sec.
2025-11-14 17:28:28,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-K_2023-02-21' --> 'data\processed_data\PLTR\10-K_2023-02-21.md'


2025-11-14 17:28:29,363 - INFO - Going to convert document batch...
2025-11-14 17:28:29,364 - INFO - Processing document 10-K_2024-02-20
2025-11-14 17:28:30,184 - INFO - Finished converting document 10-K_2024-02-20 in 1.25 sec.
2025-11-14 17:28:30,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-K_2024-02-20' --> 'data\processed_data\PLTR\10-K_2024-02-20.md'


2025-11-14 17:28:31,170 - INFO - Going to convert document batch...
2025-11-14 17:28:31,171 - INFO - Processing document 10-K_2025-02-18
2025-11-14 17:28:32,026 - INFO - Finished converting document 10-K_2025-02-18 in 1.55 sec.
2025-11-14 17:28:32,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-K_2025-02-18' --> 'data\processed_data\PLTR\10-K_2025-02-18.md'


2025-11-14 17:28:32,651 - INFO - Going to convert document batch...
2025-11-14 17:28:32,652 - INFO - Processing document 10-Q_2023-05-09
2025-11-14 17:28:33,099 - INFO - Finished converting document 10-Q_2023-05-09 in 0.72 sec.
2025-11-14 17:28:33,329 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2023-05-09' --> 'data\processed_data\PLTR\10-Q_2023-05-09.md'


2025-11-14 17:28:33,969 - INFO - Going to convert document batch...
2025-11-14 17:28:33,970 - INFO - Processing document 10-Q_2023-08-08
2025-11-14 17:28:34,545 - INFO - Finished converting document 10-Q_2023-08-08 in 1.25 sec.
2025-11-14 17:28:34,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2023-08-08' --> 'data\processed_data\PLTR\10-Q_2023-08-08.md'


2025-11-14 17:28:35,164 - INFO - Going to convert document batch...
2025-11-14 17:28:35,165 - INFO - Processing document 10-Q_2023-11-03
2025-11-14 17:28:35,783 - INFO - Finished converting document 10-Q_2023-11-03 in 0.97 sec.
2025-11-14 17:28:36,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2023-11-03' --> 'data\processed_data\PLTR\10-Q_2023-11-03.md'


2025-11-14 17:28:36,643 - INFO - Going to convert document batch...
2025-11-14 17:28:36,644 - INFO - Processing document 10-Q_2024-05-07
2025-11-14 17:28:37,106 - INFO - Finished converting document 10-Q_2024-05-07 in 1.06 sec.
2025-11-14 17:28:37,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2024-05-07' --> 'data\processed_data\PLTR\10-Q_2024-05-07.md'


2025-11-14 17:28:37,684 - INFO - Going to convert document batch...
2025-11-14 17:28:37,685 - INFO - Processing document 10-Q_2024-08-06
2025-11-14 17:28:38,301 - INFO - Finished converting document 10-Q_2024-08-06 in 0.98 sec.
2025-11-14 17:28:38,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2024-08-06' --> 'data\processed_data\PLTR\10-Q_2024-08-06.md'


2025-11-14 17:28:39,235 - INFO - Going to convert document batch...
2025-11-14 17:28:39,236 - INFO - Processing document 10-Q_2024-11-05
2025-11-14 17:28:39,881 - INFO - Finished converting document 10-Q_2024-11-05 in 1.30 sec.
2025-11-14 17:28:40,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2024-11-05' --> 'data\processed_data\PLTR\10-Q_2024-11-05.md'


2025-11-14 17:28:40,452 - INFO - Going to convert document batch...
2025-11-14 17:28:40,453 - INFO - Processing document 10-Q_2025-05-06
2025-11-14 17:28:40,944 - INFO - Finished converting document 10-Q_2025-05-06 in 0.77 sec.
2025-11-14 17:28:41,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2025-05-06' --> 'data\processed_data\PLTR\10-Q_2025-05-06.md'


2025-11-14 17:28:41,825 - INFO - Going to convert document batch...
2025-11-14 17:28:41,826 - INFO - Processing document 10-Q_2025-08-05
2025-11-14 17:28:42,431 - INFO - Finished converting document 10-Q_2025-08-05 in 1.27 sec.
2025-11-14 17:28:42,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\10-Q_2025-08-05' --> 'data\processed_data\PLTR\10-Q_2025-08-05.md'


2025-11-14 17:28:43,091 - INFO - Going to convert document batch...
2025-11-14 17:28:43,092 - INFO - Processing document 10-Q_2025-11-04
2025-11-14 17:28:43,729 - INFO - Finished converting document 10-Q_2025-11-04 in 1.03 sec.
2025-11-14 17:28:44,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,025 - INFO - Going to convert document batch...
2025-11-14 17:28:44,026 - INFO - Processing document 4_2023-01-05
2025-11-14 17:28:44,045 - INFO - Finished converting document 4_2023-01-05 in 0.05 sec.
2025-11-14 17:28:44,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,086 - INFO - Going to convert document batch...
2025-11-14 17:28:44,088 - INFO - Processing document 4_2023-02-17
2025-11-14 17:28:44,105 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 17:28:44,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,169 - INFO - Going to convert document batch...
2025-11-14 17:28:44,

Converted 'data\edgar_documents\PLTR\10-Q_2025-11-04' --> 'data\processed_data\PLTR\10-Q_2025-11-04.md'
Converted 'data\edgar_documents\PLTR\4_2023-01-05' --> 'data\processed_data\PLTR\4_2023-01-05.md'
Converted 'data\edgar_documents\PLTR\4_2023-02-17' --> 'data\processed_data\PLTR\4_2023-02-17.md'


2025-11-14 17:28:44,193 - INFO - Finished converting document 4_2023-02-22 in 0.06 sec.
2025-11-14 17:28:44,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,236 - INFO - Going to convert document batch...
2025-11-14 17:28:44,237 - INFO - Processing document 4_2023-02-23
2025-11-14 17:28:44,257 - INFO - Finished converting document 4_2023-02-23 in 0.03 sec.
2025-11-14 17:28:44,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,301 - INFO - Going to convert document batch...
2025-11-14 17:28:44,302 - INFO - Processing document 4_2023-02-24
2025-11-14 17:28:44,326 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 17:28:44,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,370 - INFO - Going to convert document batch...
2025-11-14 17:28:44,371 - INFO - Processing document 4_2023-02-28
2025-11-14 17:28:44,389 - INFO - Finished converting document 4_2023-02-28 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2023-02-22' --> 'data\processed_data\PLTR\4_2023-02-22.md'
Converted 'data\edgar_documents\PLTR\4_2023-02-23' --> 'data\processed_data\PLTR\4_2023-02-23.md'
Converted 'data\edgar_documents\PLTR\4_2023-02-24' --> 'data\processed_data\PLTR\4_2023-02-24.md'


2025-11-14 17:28:44,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,429 - INFO - Going to convert document batch...
2025-11-14 17:28:44,430 - INFO - Processing document 4_2023-03-03
2025-11-14 17:28:44,448 - INFO - Finished converting document 4_2023-03-03 in 0.05 sec.
2025-11-14 17:28:44,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,501 - INFO - Going to convert document batch...
2025-11-14 17:28:44,503 - INFO - Processing document 4_2023-03-17
2025-11-14 17:28:44,526 - INFO - Finished converting document 4_2023-03-17 in 0.06 sec.
2025-11-14 17:28:44,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,575 - INFO - Going to convert document batch...
2025-11-14 17:28:44,576 - INFO - Processing document 4_2023-04-05


Converted 'data\edgar_documents\PLTR\4_2023-02-28' --> 'data\processed_data\PLTR\4_2023-02-28.md'
Converted 'data\edgar_documents\PLTR\4_2023-03-03' --> 'data\processed_data\PLTR\4_2023-03-03.md'
Converted 'data\edgar_documents\PLTR\4_2023-03-17' --> 'data\processed_data\PLTR\4_2023-03-17.md'


2025-11-14 17:28:44,597 - INFO - Finished converting document 4_2023-04-05 in 0.05 sec.
2025-11-14 17:28:44,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,645 - INFO - Going to convert document batch...
2025-11-14 17:28:44,646 - INFO - Processing document 4_2023-05-03
2025-11-14 17:28:44,669 - INFO - Finished converting document 4_2023-05-03 in 0.05 sec.
2025-11-14 17:28:44,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,738 - INFO - Going to convert document batch...
2025-11-14 17:28:44,739 - INFO - Processing document 4_2023-05-12
2025-11-14 17:28:44,759 - INFO - Finished converting document 4_2023-05-12 in 0.06 sec.
2025-11-14 17:28:44,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,804 - INFO - Going to convert document batch...
2025-11-14 17:28:44,805 - INFO - Processing document 4_2023-05-19
2025-11-14 17:28:44,824 - INFO - Finished converting document 4_2023-05-19 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2023-04-05' --> 'data\processed_data\PLTR\4_2023-04-05.md'
Converted 'data\edgar_documents\PLTR\4_2023-05-03' --> 'data\processed_data\PLTR\4_2023-05-03.md'
Converted 'data\edgar_documents\PLTR\4_2023-05-12' --> 'data\processed_data\PLTR\4_2023-05-12.md'


2025-11-14 17:28:44,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,874 - INFO - Going to convert document batch...
2025-11-14 17:28:44,875 - INFO - Processing document 4_2023-05-23
2025-11-14 17:28:44,908 - INFO - Finished converting document 4_2023-05-23 in 0.06 sec.
2025-11-14 17:28:44,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:44,991 - INFO - Going to convert document batch...
2025-11-14 17:28:44,992 - INFO - Processing document 4_2023-05-24
2025-11-14 17:28:45,013 - INFO - Finished converting document 4_2023-05-24 in 0.06 sec.


Converted 'data\edgar_documents\PLTR\4_2023-05-19' --> 'data\processed_data\PLTR\4_2023-05-19.md'
Converted 'data\edgar_documents\PLTR\4_2023-05-23' --> 'data\processed_data\PLTR\4_2023-05-23.md'
Converted 'data\edgar_documents\PLTR\4_2023-05-24' --> 'data\processed_data\PLTR\4_2023-05-24.md'


2025-11-14 17:28:45,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,075 - INFO - Going to convert document batch...
2025-11-14 17:28:45,076 - INFO - Processing document 4_2023-06-01
2025-11-14 17:28:45,101 - INFO - Finished converting document 4_2023-06-01 in 0.06 sec.
2025-11-14 17:28:45,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,156 - INFO - Going to convert document batch...
2025-11-14 17:28:45,156 - INFO - Processing document 4_2023-06-07
2025-11-14 17:28:45,182 - INFO - Finished converting document 4_2023-06-07 in 0.06 sec.
2025-11-14 17:28:45,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,230 - INFO - Going to convert document batch...
2025-11-14 17:28:45,231 - INFO - Processing document 4_2023-06-09
2025-11-14 17:28:45,248 - INFO - Finished converting document 4_2023-06-09 in 0.05 sec.
2025-11-14 17:28:45,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\PLTR\4_2023-06-01' --> 'data\processed_data\PLTR\4_2023-06-01.md'
Converted 'data\edgar_documents\PLTR\4_2023-06-07' --> 'data\processed_data\PLTR\4_2023-06-07.md'
Converted 'data\edgar_documents\PLTR\4_2023-06-09' --> 'data\processed_data\PLTR\4_2023-06-09.md'


2025-11-14 17:28:45,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,361 - INFO - Going to convert document batch...
2025-11-14 17:28:45,362 - INFO - Processing document 4_2023-07-06
2025-11-14 17:28:45,390 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 17:28:45,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,457 - INFO - Going to convert document batch...
2025-11-14 17:28:45,458 - INFO - Processing document 4_2023-07-14


Converted 'data\edgar_documents\PLTR\4_2023-06-20' --> 'data\processed_data\PLTR\4_2023-06-20.md'
Converted 'data\edgar_documents\PLTR\4_2023-07-06' --> 'data\processed_data\PLTR\4_2023-07-06.md'


2025-11-14 17:28:45,800 - INFO - Finished converting document 4_2023-07-14 in 0.36 sec.
2025-11-14 17:28:45,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,846 - INFO - Going to convert document batch...
2025-11-14 17:28:45,847 - INFO - Processing document 4_2023-07-28
2025-11-14 17:28:45,871 - INFO - Finished converting document 4_2023-07-28 in 0.05 sec.
2025-11-14 17:28:45,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:45,919 - INFO - Going to convert document batch...
2025-11-14 17:28:45,920 - INFO - Processing document 4_2023-08-03
2025-11-14 17:28:45,953 - INFO - Finished converting document 4_2023-08-03 in 0.06 sec.
2025-11-14 17:28:45,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,003 - INFO - Going to convert document batch...
2025-11-14 17:28:46,004 - INFO - Processing document 4_2023-08-21


Converted 'data\edgar_documents\PLTR\4_2023-07-14' --> 'data\processed_data\PLTR\4_2023-07-14.md'
Converted 'data\edgar_documents\PLTR\4_2023-07-28' --> 'data\processed_data\PLTR\4_2023-07-28.md'
Converted 'data\edgar_documents\PLTR\4_2023-08-03' --> 'data\processed_data\PLTR\4_2023-08-03.md'


2025-11-14 17:28:46,025 - INFO - Finished converting document 4_2023-08-21 in 0.03 sec.
2025-11-14 17:28:46,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,068 - INFO - Going to convert document batch...
2025-11-14 17:28:46,069 - INFO - Processing document 4_2023-08-22
2025-11-14 17:28:46,107 - INFO - Finished converting document 4_2023-08-22 in 0.06 sec.
2025-11-14 17:28:46,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,168 - INFO - Going to convert document batch...
2025-11-14 17:28:46,168 - INFO - Processing document 4_2023-08-23
2025-11-14 17:28:46,191 - INFO - Finished converting document 4_2023-08-23 in 0.05 sec.
2025-11-14 17:28:46,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,233 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2023-08-21' --> 'data\processed_data\PLTR\4_2023-08-21.md'
Converted 'data\edgar_documents\PLTR\4_2023-08-22' --> 'data\processed_data\PLTR\4_2023-08-22.md'
Converted 'data\edgar_documents\PLTR\4_2023-08-23' --> 'data\processed_data\PLTR\4_2023-08-23.md'


2025-11-14 17:28:46,234 - INFO - Processing document 4_2023-08-25
2025-11-14 17:28:46,253 - INFO - Finished converting document 4_2023-08-25 in 0.03 sec.
2025-11-14 17:28:46,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,299 - INFO - Going to convert document batch...
2025-11-14 17:28:46,300 - INFO - Processing document 4_2023-08-31
2025-11-14 17:28:46,324 - INFO - Finished converting document 4_2023-08-31 in 0.06 sec.
2025-11-14 17:28:46,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,367 - INFO - Going to convert document batch...
2025-11-14 17:28:46,368 - INFO - Processing document 4_2023-09-06
2025-11-14 17:28:46,388 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 17:28:46,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,433 - INFO - Going to convert document batch...
2025-11-14 17:28:46,433 - INFO - Processing document 4_2023-09-07


Converted 'data\edgar_documents\PLTR\4_2023-08-25' --> 'data\processed_data\PLTR\4_2023-08-25.md'
Converted 'data\edgar_documents\PLTR\4_2023-08-31' --> 'data\processed_data\PLTR\4_2023-08-31.md'
Converted 'data\edgar_documents\PLTR\4_2023-09-06' --> 'data\processed_data\PLTR\4_2023-09-06.md'


2025-11-14 17:28:46,456 - INFO - Finished converting document 4_2023-09-07 in 0.05 sec.
2025-11-14 17:28:46,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,506 - INFO - Going to convert document batch...
2025-11-14 17:28:46,508 - INFO - Processing document 4_2023-09-14
2025-11-14 17:28:46,553 - INFO - Finished converting document 4_2023-09-14 in 0.06 sec.
2025-11-14 17:28:46,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,598 - INFO - Going to convert document batch...
2025-11-14 17:28:46,598 - INFO - Processing document 4_2023-09-19
2025-11-14 17:28:46,618 - INFO - Finished converting document 4_2023-09-19 in 0.03 sec.
2025-11-14 17:28:46,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,657 - INFO - Going to convert document batch...
2025-11-14 17:28:46,658 - INFO - Processing document 4_2023-10-04
2025-11-14 17:28:46,676 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.


Converted 'data\edgar_documents\PLTR\4_2023-09-07' --> 'data\processed_data\PLTR\4_2023-09-07.md'
Converted 'data\edgar_documents\PLTR\4_2023-09-14' --> 'data\processed_data\PLTR\4_2023-09-14.md'
Converted 'data\edgar_documents\PLTR\4_2023-09-19' --> 'data\processed_data\PLTR\4_2023-09-19.md'


2025-11-14 17:28:46,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,718 - INFO - Going to convert document batch...
2025-11-14 17:28:46,718 - INFO - Processing document 4_2023-11-03
2025-11-14 17:28:46,740 - INFO - Finished converting document 4_2023-11-03 in 0.05 sec.
2025-11-14 17:28:46,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,783 - INFO - Going to convert document batch...
2025-11-14 17:28:46,784 - INFO - Processing document 4_2023-11-16
2025-11-14 17:28:46,805 - INFO - Finished converting document 4_2023-11-16 in 0.03 sec.
2025-11-14 17:28:46,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,848 - INFO - Going to convert document batch...
2025-11-14 17:28:46,849 - INFO - Processing document 4_2023-11-22
2025-11-14 17:28:46,872 - INFO - Finished converting document 4_2023-11-22 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2023-10-04' --> 'data\processed_data\PLTR\4_2023-10-04.md'
Converted 'data\edgar_documents\PLTR\4_2023-11-03' --> 'data\processed_data\PLTR\4_2023-11-03.md'
Converted 'data\edgar_documents\PLTR\4_2023-11-16' --> 'data\processed_data\PLTR\4_2023-11-16.md'


2025-11-14 17:28:46,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:46,916 - INFO - Going to convert document batch...
2025-11-14 17:28:46,917 - INFO - Processing document 4_2023-11-28
2025-11-14 17:28:46,940 - INFO - Finished converting document 4_2023-11-28 in 0.05 sec.
2025-11-14 17:28:47,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,014 - INFO - Going to convert document batch...
2025-11-14 17:28:47,015 - INFO - Processing document 4_2023-12-05
2025-11-14 17:28:47,031 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 17:28:47,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,072 - INFO - Going to convert document batch...
2025-11-14 17:28:47,073 - INFO - Processing document 4_2023-12-08


Converted 'data\edgar_documents\PLTR\4_2023-11-22' --> 'data\processed_data\PLTR\4_2023-11-22.md'
Converted 'data\edgar_documents\PLTR\4_2023-11-28' --> 'data\processed_data\PLTR\4_2023-11-28.md'
Converted 'data\edgar_documents\PLTR\4_2023-12-05' --> 'data\processed_data\PLTR\4_2023-12-05.md'


2025-11-14 17:28:47,094 - INFO - Finished converting document 4_2023-12-08 in 0.05 sec.
2025-11-14 17:28:47,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,137 - INFO - Going to convert document batch...
2025-11-14 17:28:47,137 - INFO - Processing document 4_2024-01-04
2025-11-14 17:28:47,156 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 17:28:47,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,202 - INFO - Going to convert document batch...
2025-11-14 17:28:47,203 - INFO - Processing document 4_2024-01-12
2025-11-14 17:28:47,230 - INFO - Finished converting document 4_2024-01-12 in 0.06 sec.
2025-11-14 17:28:47,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,275 - INFO - Going to convert document batch...
2025-11-14 17:28:47,275 - INFO - Processing document 4_2024-02-05
2025-11-14 17:28:47,293 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2023-12-08' --> 'data\processed_data\PLTR\4_2023-12-08.md'
Converted 'data\edgar_documents\PLTR\4_2024-01-04' --> 'data\processed_data\PLTR\4_2024-01-04.md'
Converted 'data\edgar_documents\PLTR\4_2024-01-12' --> 'data\processed_data\PLTR\4_2024-01-12.md'


2025-11-14 17:28:47,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,337 - INFO - Going to convert document batch...
2025-11-14 17:28:47,338 - INFO - Processing document 4_2024-02-08
2025-11-14 17:28:47,381 - INFO - Finished converting document 4_2024-02-08 in 0.06 sec.
2025-11-14 17:28:47,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,454 - INFO - Going to convert document batch...
2025-11-14 17:28:47,455 - INFO - Processing document 4_2024-02-09
2025-11-14 17:28:47,481 - INFO - Finished converting document 4_2024-02-09 in 0.06 sec.


Converted 'data\edgar_documents\PLTR\4_2024-02-05' --> 'data\processed_data\PLTR\4_2024-02-05.md'
Converted 'data\edgar_documents\PLTR\4_2024-02-08' --> 'data\processed_data\PLTR\4_2024-02-08.md'


2025-11-14 17:28:47,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,538 - INFO - Going to convert document batch...
2025-11-14 17:28:47,539 - INFO - Processing document 4_2024-02-12
2025-11-14 17:28:47,593 - INFO - Finished converting document 4_2024-02-12 in 0.09 sec.
2025-11-14 17:28:47,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,671 - INFO - Going to convert document batch...
2025-11-14 17:28:47,672 - INFO - Processing document 4_2024-02-13
2025-11-14 17:28:47,690 - INFO - Finished converting document 4_2024-02-13 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2024-02-09' --> 'data\processed_data\PLTR\4_2024-02-09.md'
Converted 'data\edgar_documents\PLTR\4_2024-02-12' --> 'data\processed_data\PLTR\4_2024-02-12.md'


2025-11-14 17:28:47,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,731 - INFO - Going to convert document batch...
2025-11-14 17:28:47,732 - INFO - Processing document 4_2024-02-22
2025-11-14 17:28:47,757 - INFO - Finished converting document 4_2024-02-22 in 0.05 sec.
2025-11-14 17:28:47,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,801 - INFO - Going to convert document batch...
2025-11-14 17:28:47,801 - INFO - Processing document 4_2024-03-05
2025-11-14 17:28:47,819 - INFO - Finished converting document 4_2024-03-05 in 0.03 sec.
2025-11-14 17:28:47,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,863 - INFO - Going to convert document batch...
2025-11-14 17:28:47,863 - INFO - Processing document 4_2024-03-08
2025-11-14 17:28:47,886 - INFO - Finished converting document 4_2024-03-08 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2024-02-13' --> 'data\processed_data\PLTR\4_2024-02-13.md'
Converted 'data\edgar_documents\PLTR\4_2024-02-22' --> 'data\processed_data\PLTR\4_2024-02-22.md'
Converted 'data\edgar_documents\PLTR\4_2024-03-05' --> 'data\processed_data\PLTR\4_2024-03-05.md'


2025-11-14 17:28:47,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:47,931 - INFO - Going to convert document batch...
2025-11-14 17:28:47,932 - INFO - Processing document 4_2024-03-12
2025-11-14 17:28:47,959 - INFO - Finished converting document 4_2024-03-12 in 0.05 sec.
2025-11-14 17:28:48,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,032 - INFO - Going to convert document batch...
2025-11-14 17:28:48,033 - INFO - Processing document 4_2024-03-19
2025-11-14 17:28:48,059 - INFO - Finished converting document 4_2024-03-19 in 0.08 sec.


Converted 'data\edgar_documents\PLTR\4_2024-03-08' --> 'data\processed_data\PLTR\4_2024-03-08.md'
Converted 'data\edgar_documents\PLTR\4_2024-03-12' --> 'data\processed_data\PLTR\4_2024-03-12.md'
Converted 'data\edgar_documents\PLTR\4_2024-03-19' --> 'data\processed_data\PLTR\4_2024-03-19.md'


2025-11-14 17:28:48,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,120 - INFO - Going to convert document batch...
2025-11-14 17:28:48,121 - INFO - Processing document 4_2024-04-02
2025-11-14 17:28:48,138 - INFO - Finished converting document 4_2024-04-02 in 0.06 sec.
2025-11-14 17:28:48,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,180 - INFO - Going to convert document batch...
2025-11-14 17:28:48,181 - INFO - Processing document 4_2024-04-03
2025-11-14 17:28:48,200 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 17:28:48,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,242 - INFO - Going to convert document batch...
2025-11-14 17:28:48,242 - INFO - Processing document 4_2024-04-16
2025-11-14 17:28:48,264 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 17:28:48,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\PLTR\4_2024-04-02' --> 'data\processed_data\PLTR\4_2024-04-02.md'
Converted 'data\edgar_documents\PLTR\4_2024-04-03' --> 'data\processed_data\PLTR\4_2024-04-03.md'
Converted 'data\edgar_documents\PLTR\4_2024-04-16' --> 'data\processed_data\PLTR\4_2024-04-16.md'
Converted 'data\edgar_documents\PLTR\4_2024-04-19' --> 'data\processed_data\PLTR\4_2024-04-19.md'


2025-11-14 17:28:48,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,394 - INFO - Going to convert document batch...
2025-11-14 17:28:48,394 - INFO - Processing document 4_2024-04-24
2025-11-14 17:28:48,414 - INFO - Finished converting document 4_2024-04-24 in 0.06 sec.
2025-11-14 17:28:48,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,457 - INFO - Going to convert document batch...
2025-11-14 17:28:48,458 - INFO - Processing document 4_2024-05-03
2025-11-14 17:28:48,479 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.
2025-11-14 17:28:48,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,545 - INFO - Going to convert document batch...
2025-11-14 17:28:48,546 - INFO - Processing document 4_2024-05-10
2025-11-14 17:28:48,570 - INFO - Finished converting document 4_2024-05-10 in 0.06 sec.
2025-11-14 17:28:48,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-04-24' --> 'data\processed_data\PLTR\4_2024-04-24.md'
Converted 'data\edgar_documents\PLTR\4_2024-05-03' --> 'data\processed_data\PLTR\4_2024-05-03.md'
Converted 'data\edgar_documents\PLTR\4_2024-05-10' --> 'data\processed_data\PLTR\4_2024-05-10.md'


2025-11-14 17:28:48,644 - INFO - Going to convert document batch...
2025-11-14 17:28:48,646 - INFO - Processing document 4_2024-05-22
2025-11-14 17:28:48,671 - INFO - Finished converting document 4_2024-05-22 in 0.08 sec.
2025-11-14 17:28:48,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,718 - INFO - Going to convert document batch...
2025-11-14 17:28:48,719 - INFO - Processing document 4_2024-05-28
2025-11-14 17:28:48,745 - INFO - Finished converting document 4_2024-05-28 in 0.06 sec.
2025-11-14 17:28:48,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,809 - INFO - Going to convert document batch...
2025-11-14 17:28:48,810 - INFO - Processing document 4_2024-06-04
2025-11-14 17:28:48,830 - INFO - Finished converting document 4_2024-06-04 in 0.06 sec.


Converted 'data\edgar_documents\PLTR\4_2024-05-22' --> 'data\processed_data\PLTR\4_2024-05-22.md'
Converted 'data\edgar_documents\PLTR\4_2024-05-28' --> 'data\processed_data\PLTR\4_2024-05-28.md'
Converted 'data\edgar_documents\PLTR\4_2024-06-04' --> 'data\processed_data\PLTR\4_2024-06-04.md'


2025-11-14 17:28:48,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,886 - INFO - Going to convert document batch...
2025-11-14 17:28:48,887 - INFO - Processing document 4_2024-06-07
2025-11-14 17:28:48,909 - INFO - Finished converting document 4_2024-06-07 in 0.06 sec.
2025-11-14 17:28:48,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:48,955 - INFO - Going to convert document batch...
2025-11-14 17:28:48,956 - INFO - Processing document 4_2024-06-10
2025-11-14 17:28:48,984 - INFO - Finished converting document 4_2024-06-10 in 0.05 sec.
2025-11-14 17:28:49,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,064 - INFO - Going to convert document batch...
2025-11-14 17:28:49,065 - INFO - Processing document 4_2024-06-13
2025-11-14 17:28:49,085 - INFO - Finished converting document 4_2024-06-13 in 0.06 sec.
2025-11-14 17:28:49,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\PLTR\4_2024-06-07' --> 'data\processed_data\PLTR\4_2024-06-07.md'
Converted 'data\edgar_documents\PLTR\4_2024-06-10' --> 'data\processed_data\PLTR\4_2024-06-10.md'
Converted 'data\edgar_documents\PLTR\4_2024-06-13' --> 'data\processed_data\PLTR\4_2024-06-13.md'


2025-11-14 17:28:49,125 - INFO - Processing document 4_2024-06-14
2025-11-14 17:28:49,143 - INFO - Finished converting document 4_2024-06-14 in 0.03 sec.
2025-11-14 17:28:49,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,198 - INFO - Going to convert document batch...
2025-11-14 17:28:49,200 - INFO - Processing document 4_2024-06-20
2025-11-14 17:28:49,225 - INFO - Finished converting document 4_2024-06-20 in 0.06 sec.
2025-11-14 17:28:49,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,267 - INFO - Going to convert document batch...
2025-11-14 17:28:49,267 - INFO - Processing document 4_2024-06-21
2025-11-14 17:28:49,286 - INFO - Finished converting document 4_2024-06-21 in 0.03 sec.
2025-11-14 17:28:49,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,347 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2024-06-14' --> 'data\processed_data\PLTR\4_2024-06-14.md'
Converted 'data\edgar_documents\PLTR\4_2024-06-20' --> 'data\processed_data\PLTR\4_2024-06-20.md'
Converted 'data\edgar_documents\PLTR\4_2024-06-21' --> 'data\processed_data\PLTR\4_2024-06-21.md'


2025-11-14 17:28:49,348 - INFO - Processing document 4_2024-07-02
2025-11-14 17:28:49,365 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 17:28:49,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,433 - INFO - Going to convert document batch...
2025-11-14 17:28:49,435 - INFO - Processing document 4_2024-07-08
2025-11-14 17:28:49,459 - INFO - Finished converting document 4_2024-07-08 in 0.06 sec.
2025-11-14 17:28:49,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,503 - INFO - Going to convert document batch...
2025-11-14 17:28:49,504 - INFO - Processing document 4_2024-07-11
2025-11-14 17:28:49,526 - INFO - Finished converting document 4_2024-07-11 in 0.05 sec.
2025-11-14 17:28:49,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,569 - INFO - Going to convert document batch...
2025-11-14 17:28:49,570 - INFO - Processing document 4_2024-07-12
2025-11-14 17:28:49,589 - IN

Converted 'data\edgar_documents\PLTR\4_2024-07-02' --> 'data\processed_data\PLTR\4_2024-07-02.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-08' --> 'data\processed_data\PLTR\4_2024-07-08.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-11' --> 'data\processed_data\PLTR\4_2024-07-11.md'


2025-11-14 17:28:49,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,649 - INFO - Going to convert document batch...
2025-11-14 17:28:49,650 - INFO - Processing document 4_2024-07-16
2025-11-14 17:28:49,672 - INFO - Finished converting document 4_2024-07-16 in 0.06 sec.
2025-11-14 17:28:49,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,715 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2024-07-12' --> 'data\processed_data\PLTR\4_2024-07-12.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-16' --> 'data\processed_data\PLTR\4_2024-07-16.md'


2025-11-14 17:28:49,931 - INFO - Processing document 4_2024-07-17
2025-11-14 17:28:49,952 - INFO - Finished converting document 4_2024-07-17 in 0.27 sec.
2025-11-14 17:28:49,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:49,996 - INFO - Going to convert document batch...
2025-11-14 17:28:49,997 - INFO - Processing document 4_2024-07-19
2025-11-14 17:28:50,018 - INFO - Finished converting document 4_2024-07-19 in 0.05 sec.
2025-11-14 17:28:50,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,062 - INFO - Going to convert document batch...
2025-11-14 17:28:50,063 - INFO - Processing document 4_2024-07-22
2025-11-14 17:28:50,086 - INFO - Finished converting document 4_2024-07-22 in 0.05 sec.
2025-11-14 17:28:50,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,130 - INFO - Going to convert document batch...
2025-11-14 17:28:50,131 - INFO - Processing document 4_2024-07-24
2025-11-14 17:28:50,148 - IN

Converted 'data\edgar_documents\PLTR\4_2024-07-17' --> 'data\processed_data\PLTR\4_2024-07-17.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-19' --> 'data\processed_data\PLTR\4_2024-07-19.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-22' --> 'data\processed_data\PLTR\4_2024-07-22.md'


2025-11-14 17:28:50,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,188 - INFO - Going to convert document batch...
2025-11-14 17:28:50,189 - INFO - Processing document 4_2024-07-30
2025-11-14 17:28:50,211 - INFO - Finished converting document 4_2024-07-30 in 0.03 sec.
2025-11-14 17:28:50,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,265 - INFO - Going to convert document batch...
2025-11-14 17:28:50,266 - INFO - Processing document 4_2024-08-02
2025-11-14 17:28:50,286 - INFO - Finished converting document 4_2024-08-02 in 0.05 sec.
2025-11-14 17:28:50,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,330 - INFO - Going to convert document batch...
2025-11-14 17:28:50,330 - INFO - Processing document 4_2024-08-05
2025-11-14 17:28:50,350 - INFO - Finished converting document 4_2024-08-05 in 0.03 sec.


Converted 'data\edgar_documents\PLTR\4_2024-07-24' --> 'data\processed_data\PLTR\4_2024-07-24.md'
Converted 'data\edgar_documents\PLTR\4_2024-07-30' --> 'data\processed_data\PLTR\4_2024-07-30.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-02' --> 'data\processed_data\PLTR\4_2024-08-02.md'


2025-11-14 17:28:50,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,392 - INFO - Going to convert document batch...
2025-11-14 17:28:50,393 - INFO - Processing document 4_2024-08-07
2025-11-14 17:28:50,435 - INFO - Finished converting document 4_2024-08-07 in 0.06 sec.
2025-11-14 17:28:50,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,487 - INFO - Going to convert document batch...
2025-11-14 17:28:50,488 - INFO - Processing document 4_2024-08-12
2025-11-14 17:28:50,513 - INFO - Finished converting document 4_2024-08-12 in 0.05 sec.
2025-11-14 17:28:50,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,556 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2024-08-05' --> 'data\processed_data\PLTR\4_2024-08-05.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-07' --> 'data\processed_data\PLTR\4_2024-08-07.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-12' --> 'data\processed_data\PLTR\4_2024-08-12.md'


2025-11-14 17:28:50,557 - INFO - Processing document 4_2024-08-13
2025-11-14 17:28:50,580 - INFO - Finished converting document 4_2024-08-13 in 0.05 sec.
2025-11-14 17:28:50,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,630 - INFO - Going to convert document batch...
2025-11-14 17:28:50,631 - INFO - Processing document 4_2024-08-14
2025-11-14 17:28:50,671 - INFO - Finished converting document 4_2024-08-14 in 0.08 sec.
2025-11-14 17:28:50,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,719 - INFO - Going to convert document batch...
2025-11-14 17:28:50,720 - INFO - Processing document 4_2024-08-15
2025-11-14 17:28:50,740 - INFO - Finished converting document 4_2024-08-15 in 0.03 sec.
2025-11-14 17:28:50,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,781 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2024-08-13' --> 'data\processed_data\PLTR\4_2024-08-13.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-14' --> 'data\processed_data\PLTR\4_2024-08-14.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-15' --> 'data\processed_data\PLTR\4_2024-08-15.md'


2025-11-14 17:28:50,781 - INFO - Processing document 4_2024-08-20
2025-11-14 17:28:50,803 - INFO - Finished converting document 4_2024-08-20 in 0.03 sec.
2025-11-14 17:28:50,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,850 - INFO - Going to convert document batch...
2025-11-14 17:28:50,850 - INFO - Processing document 4_2024-08-22
2025-11-14 17:28:50,873 - INFO - Finished converting document 4_2024-08-22 in 0.05 sec.
2025-11-14 17:28:50,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:50,916 - INFO - Going to convert document batch...
2025-11-14 17:28:50,917 - INFO - Processing document 4_2024-08-26
2025-11-14 17:28:50,937 - INFO - Finished converting document 4_2024-08-26 in 0.05 sec.
2025-11-14 17:28:50,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,001 - INFO - Going to convert document batch...
2025-11-14 17:28:51,002 - INFO - Processing document 4_2024-08-29
2025-11-14 17:28:51,025 - IN

Converted 'data\edgar_documents\PLTR\4_2024-08-20' --> 'data\processed_data\PLTR\4_2024-08-20.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-22' --> 'data\processed_data\PLTR\4_2024-08-22.md'
Converted 'data\edgar_documents\PLTR\4_2024-08-26' --> 'data\processed_data\PLTR\4_2024-08-26.md'


2025-11-14 17:28:51,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,067 - INFO - Going to convert document batch...
2025-11-14 17:28:51,068 - INFO - Processing document 4_2024-09-03
2025-11-14 17:28:51,087 - INFO - Finished converting document 4_2024-09-03 in 0.03 sec.
2025-11-14 17:28:51,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,154 - INFO - Going to convert document batch...
2025-11-14 17:28:51,155 - INFO - Processing document 4_2024-09-04
2025-11-14 17:28:51,181 - INFO - Finished converting document 4_2024-09-04 in 0.06 sec.
2025-11-14 17:28:51,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,224 - INFO - Going to convert document batch...
2025-11-14 17:28:51,224 - INFO - Processing document 4_2024-09-05


Converted 'data\edgar_documents\PLTR\4_2024-08-29' --> 'data\processed_data\PLTR\4_2024-08-29.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-03' --> 'data\processed_data\PLTR\4_2024-09-03.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-04' --> 'data\processed_data\PLTR\4_2024-09-04.md'


2025-11-14 17:28:51,245 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 17:28:51,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,289 - INFO - Going to convert document batch...
2025-11-14 17:28:51,290 - INFO - Processing document 4_2024-09-09
2025-11-14 17:28:51,311 - INFO - Finished converting document 4_2024-09-09 in 0.05 sec.
2025-11-14 17:28:51,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,354 - INFO - Going to convert document batch...
2025-11-14 17:28:51,355 - INFO - Processing document 4_2024-09-11
2025-11-14 17:28:51,374 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.
2025-11-14 17:28:51,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,415 - INFO - Going to convert document batch...
2025-11-14 17:28:51,416 - INFO - Processing document 4_2024-09-12
2025-11-14 17:28:51,436 - INFO - Finished converting document 4_2024-09-12 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2024-09-05' --> 'data\processed_data\PLTR\4_2024-09-05.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-09' --> 'data\processed_data\PLTR\4_2024-09-09.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-11' --> 'data\processed_data\PLTR\4_2024-09-11.md'


2025-11-14 17:28:51,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,482 - INFO - Going to convert document batch...
2025-11-14 17:28:51,483 - INFO - Processing document 4_2024-09-16
2025-11-14 17:28:51,507 - INFO - Finished converting document 4_2024-09-16 in 0.05 sec.
2025-11-14 17:28:51,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,561 - INFO - Going to convert document batch...
2025-11-14 17:28:51,562 - INFO - Processing document 4_2024-09-17
2025-11-14 17:28:51,596 - INFO - Finished converting document 4_2024-09-17 in 0.06 sec.
2025-11-14 17:28:51,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-09-12' --> 'data\processed_data\PLTR\4_2024-09-12.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-16' --> 'data\processed_data\PLTR\4_2024-09-16.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-17' --> 'data\processed_data\PLTR\4_2024-09-17.md'


2025-11-14 17:28:51,666 - INFO - Going to convert document batch...
2025-11-14 17:28:51,667 - INFO - Processing document 4_2024-09-18
2025-11-14 17:28:51,691 - INFO - Finished converting document 4_2024-09-18 in 0.06 sec.
2025-11-14 17:28:51,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,747 - INFO - Going to convert document batch...
2025-11-14 17:28:51,748 - INFO - Processing document 4_2024-09-19
2025-11-14 17:28:51,771 - INFO - Finished converting document 4_2024-09-19 in 0.05 sec.
2025-11-14 17:28:51,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,814 - INFO - Going to convert document batch...
2025-11-14 17:28:51,815 - INFO - Processing document 4_2024-09-20
2025-11-14 17:28:51,835 - INFO - Finished converting document 4_2024-09-20 in 0.03 sec.
2025-11-14 17:28:51,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,880 - INFO - Going to convert document batch...
2025-11-14 17:28:51,880 - 

Converted 'data\edgar_documents\PLTR\4_2024-09-18' --> 'data\processed_data\PLTR\4_2024-09-18.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-19' --> 'data\processed_data\PLTR\4_2024-09-19.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-20' --> 'data\processed_data\PLTR\4_2024-09-20.md'


2025-11-14 17:28:51,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:51,946 - INFO - Going to convert document batch...
2025-11-14 17:28:51,947 - INFO - Processing document 4_2024-09-25
2025-11-14 17:28:51,969 - INFO - Finished converting document 4_2024-09-25 in 0.05 sec.
2025-11-14 17:28:52,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,017 - INFO - Going to convert document batch...
2025-11-14 17:28:52,018 - INFO - Processing document 4_2024-09-26
2025-11-14 17:28:52,068 - INFO - Finished converting document 4_2024-09-26 in 0.08 sec.
2025-11-14 17:28:52,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-09-24' --> 'data\processed_data\PLTR\4_2024-09-24.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-25' --> 'data\processed_data\PLTR\4_2024-09-25.md'
Converted 'data\edgar_documents\PLTR\4_2024-09-26' --> 'data\processed_data\PLTR\4_2024-09-26.md'


2025-11-14 17:28:52,121 - INFO - Going to convert document batch...
2025-11-14 17:28:52,122 - INFO - Processing document 4_2024-09-27
2025-11-14 17:28:52,143 - INFO - Finished converting document 4_2024-09-27 in 0.05 sec.
2025-11-14 17:28:52,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,195 - INFO - Going to convert document batch...
2025-11-14 17:28:52,195 - INFO - Processing document 4_2024-10-01
2025-11-14 17:28:52,227 - INFO - Finished converting document 4_2024-10-01 in 0.05 sec.
2025-11-14 17:28:52,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,278 - INFO - Going to convert document batch...
2025-11-14 17:28:52,279 - INFO - Processing document 4_2024-10-02
2025-11-14 17:28:52,296 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:28:52,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,357 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2024-09-27' --> 'data\processed_data\PLTR\4_2024-09-27.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-01' --> 'data\processed_data\PLTR\4_2024-10-01.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-02' --> 'data\processed_data\PLTR\4_2024-10-02.md'


2025-11-14 17:28:52,358 - INFO - Processing document 4_2024-10-03
2025-11-14 17:28:52,379 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 17:28:52,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,423 - INFO - Going to convert document batch...
2025-11-14 17:28:52,424 - INFO - Processing document 4_2024-10-04
2025-11-14 17:28:52,444 - INFO - Finished converting document 4_2024-10-04 in 0.03 sec.
2025-11-14 17:28:52,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,487 - INFO - Going to convert document batch...
2025-11-14 17:28:52,488 - INFO - Processing document 4_2024-10-07
2025-11-14 17:28:52,517 - INFO - Finished converting document 4_2024-10-07 in 0.05 sec.
2025-11-14 17:28:52,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,571 - INFO - Going to convert document batch...
2025-11-14 17:28:52,571 - INFO - Processing document 4_2024-10-08
2025-11-14 17:28:52,592 - IN

Converted 'data\edgar_documents\PLTR\4_2024-10-03' --> 'data\processed_data\PLTR\4_2024-10-03.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-04' --> 'data\processed_data\PLTR\4_2024-10-04.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-07' --> 'data\processed_data\PLTR\4_2024-10-07.md'


2025-11-14 17:28:52,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,634 - INFO - Going to convert document batch...
2025-11-14 17:28:52,636 - INFO - Processing document 4_2024-10-15
2025-11-14 17:28:52,656 - INFO - Finished converting document 4_2024-10-15 in 0.05 sec.
2025-11-14 17:28:52,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,739 - INFO - Going to convert document batch...
2025-11-14 17:28:52,739 - INFO - Processing document 4_2024-10-29
2025-11-14 17:28:52,762 - INFO - Finished converting document 4_2024-10-29 in 0.06 sec.
2025-11-14 17:28:52,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-10-08' --> 'data\processed_data\PLTR\4_2024-10-08.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-15' --> 'data\processed_data\PLTR\4_2024-10-15.md'
Converted 'data\edgar_documents\PLTR\4_2024-10-29' --> 'data\processed_data\PLTR\4_2024-10-29.md'


2025-11-14 17:28:52,805 - INFO - Going to convert document batch...
2025-11-14 17:28:52,806 - INFO - Processing document 4_2024-11-01
2025-11-14 17:28:52,827 - INFO - Finished converting document 4_2024-11-01 in 0.05 sec.
2025-11-14 17:28:52,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,872 - INFO - Going to convert document batch...
2025-11-14 17:28:52,873 - INFO - Processing document 4_2024-11-05
2025-11-14 17:28:52,894 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 17:28:52,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:52,938 - INFO - Going to convert document batch...
2025-11-14 17:28:52,939 - INFO - Processing document 4_2024-11-06
2025-11-14 17:28:52,960 - INFO - Finished converting document 4_2024-11-06 in 0.03 sec.
2025-11-14 17:28:52,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,002 - INFO - Going to convert document batch...
2025-11-14 17:28:53,003 - 

Converted 'data\edgar_documents\PLTR\4_2024-11-01' --> 'data\processed_data\PLTR\4_2024-11-01.md'
Converted 'data\edgar_documents\PLTR\4_2024-11-05' --> 'data\processed_data\PLTR\4_2024-11-05.md'
Converted 'data\edgar_documents\PLTR\4_2024-11-06' --> 'data\processed_data\PLTR\4_2024-11-06.md'


2025-11-14 17:28:53,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,061 - INFO - Going to convert document batch...
2025-11-14 17:28:53,061 - INFO - Processing document 4_2024-11-12
2025-11-14 17:28:53,083 - INFO - Finished converting document 4_2024-11-12 in 0.03 sec.
2025-11-14 17:28:53,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,174 - INFO - Going to convert document batch...
2025-11-14 17:28:53,175 - INFO - Processing document 4_2024-11-15
2025-11-14 17:28:53,217 - INFO - Finished converting document 4_2024-11-15 in 0.09 sec.


Converted 'data\edgar_documents\PLTR\4_2024-11-07' --> 'data\processed_data\PLTR\4_2024-11-07.md'
Converted 'data\edgar_documents\PLTR\4_2024-11-12' --> 'data\processed_data\PLTR\4_2024-11-12.md'


2025-11-14 17:28:53,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,285 - INFO - Going to convert document batch...
2025-11-14 17:28:53,287 - INFO - Processing document 4_2024-11-20
2025-11-14 17:28:53,344 - INFO - Finished converting document 4_2024-11-20 in 0.09 sec.
2025-11-14 17:28:53,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,413 - INFO - Going to convert document batch...
2025-11-14 17:28:53,413 - INFO - Processing document 4_2024-11-22
2025-11-14 17:28:53,441 - INFO - Finished converting document 4_2024-11-22 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2024-11-15' --> 'data\processed_data\PLTR\4_2024-11-15.md'
Converted 'data\edgar_documents\PLTR\4_2024-11-20' --> 'data\processed_data\PLTR\4_2024-11-20.md'


2025-11-14 17:28:53,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,489 - INFO - Going to convert document batch...
2025-11-14 17:28:53,490 - INFO - Processing document 4_2024-11-27
2025-11-14 17:28:53,512 - INFO - Finished converting document 4_2024-11-27 in 0.05 sec.
2025-11-14 17:28:53,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,581 - INFO - Going to convert document batch...
2025-11-14 17:28:53,582 - INFO - Processing document 4_2024-12-03
2025-11-14 17:28:53,634 - INFO - Finished converting document 4_2024-12-03 in 0.09 sec.


Converted 'data\edgar_documents\PLTR\4_2024-11-22' --> 'data\processed_data\PLTR\4_2024-11-22.md'
Converted 'data\edgar_documents\PLTR\4_2024-11-27' --> 'data\processed_data\PLTR\4_2024-11-27.md'


2025-11-14 17:28:53,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:53,691 - INFO - Going to convert document batch...
2025-11-14 17:28:53,692 - INFO - Processing document 4_2024-12-04
2025-11-14 17:28:53,711 - INFO - Finished converting document 4_2024-12-04 in 0.03 sec.
2025-11-14 17:28:53,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-12-03' --> 'data\processed_data\PLTR\4_2024-12-03.md'
Converted 'data\edgar_documents\PLTR\4_2024-12-04' --> 'data\processed_data\PLTR\4_2024-12-04.md'


2025-11-14 17:28:53,967 - INFO - Going to convert document batch...
2025-11-14 17:28:53,968 - INFO - Processing document 4_2024-12-06
2025-11-14 17:28:53,991 - INFO - Finished converting document 4_2024-12-06 in 0.25 sec.
2025-11-14 17:28:54,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,041 - INFO - Going to convert document batch...
2025-11-14 17:28:54,042 - INFO - Processing document 4_2024-12-10
2025-11-14 17:28:54,063 - INFO - Finished converting document 4_2024-12-10 in 0.05 sec.
2025-11-14 17:28:54,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,101 - INFO - Going to convert document batch...
2025-11-14 17:28:54,102 - INFO - Processing document 4_2024-12-11
2025-11-14 17:28:54,121 - INFO - Finished converting document 4_2024-12-11 in 0.05 sec.
2025-11-14 17:28:54,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,160 - INFO - Going to convert document batch...
2025-11-14 17:28:54,161 - 

Converted 'data\edgar_documents\PLTR\4_2024-12-06' --> 'data\processed_data\PLTR\4_2024-12-06.md'
Converted 'data\edgar_documents\PLTR\4_2024-12-10' --> 'data\processed_data\PLTR\4_2024-12-10.md'
Converted 'data\edgar_documents\PLTR\4_2024-12-11' --> 'data\processed_data\PLTR\4_2024-12-11.md'


2025-11-14 17:28:54,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,224 - INFO - Going to convert document batch...
2025-11-14 17:28:54,225 - INFO - Processing document 4_2024-12-16
2025-11-14 17:28:54,252 - INFO - Finished converting document 4_2024-12-16 in 0.05 sec.
2025-11-14 17:28:54,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,327 - INFO - Going to convert document batch...
2025-11-14 17:28:54,328 - INFO - Processing document 4_2025-01-06
2025-11-14 17:28:54,351 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 17:28:54,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2024-12-13' --> 'data\processed_data\PLTR\4_2024-12-13.md'
Converted 'data\edgar_documents\PLTR\4_2024-12-16' --> 'data\processed_data\PLTR\4_2024-12-16.md'
Converted 'data\edgar_documents\PLTR\4_2025-01-06' --> 'data\processed_data\PLTR\4_2025-01-06.md'


2025-11-14 17:28:54,394 - INFO - Going to convert document batch...
2025-11-14 17:28:54,395 - INFO - Processing document 4_2025-01-10
2025-11-14 17:28:54,421 - INFO - Finished converting document 4_2025-01-10 in 0.05 sec.
2025-11-14 17:28:54,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,475 - INFO - Going to convert document batch...
2025-11-14 17:28:54,475 - INFO - Processing document 4_2025-02-05
2025-11-14 17:28:54,505 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:28:54,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,567 - INFO - Going to convert document batch...
2025-11-14 17:28:54,568 - INFO - Processing document 4_2025-02-06
2025-11-14 17:28:54,585 - INFO - Finished converting document 4_2025-02-06 in 0.05 sec.
2025-11-14 17:28:54,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,643 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2025-01-10' --> 'data\processed_data\PLTR\4_2025-01-10.md'
Converted 'data\edgar_documents\PLTR\4_2025-02-05' --> 'data\processed_data\PLTR\4_2025-02-05.md'
Converted 'data\edgar_documents\PLTR\4_2025-02-06' --> 'data\processed_data\PLTR\4_2025-02-06.md'


2025-11-14 17:28:54,643 - INFO - Processing document 4_2025-02-13
2025-11-14 17:28:54,667 - INFO - Finished converting document 4_2025-02-13 in 0.06 sec.
2025-11-14 17:28:54,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,734 - INFO - Going to convert document batch...
2025-11-14 17:28:54,735 - INFO - Processing document 4_2025-02-24
2025-11-14 17:28:54,764 - INFO - Finished converting document 4_2025-02-24 in 0.06 sec.
2025-11-14 17:28:54,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,827 - INFO - Going to convert document batch...
2025-11-14 17:28:54,828 - INFO - Processing document 4_2025-03-05
2025-11-14 17:28:54,858 - INFO - Finished converting document 4_2025-03-05 in 0.08 sec.
2025-11-14 17:28:54,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2025-02-13' --> 'data\processed_data\PLTR\4_2025-02-13.md'
Converted 'data\edgar_documents\PLTR\4_2025-02-24' --> 'data\processed_data\PLTR\4_2025-02-24.md'
Converted 'data\edgar_documents\PLTR\4_2025-03-05' --> 'data\processed_data\PLTR\4_2025-03-05.md'


2025-11-14 17:28:54,908 - INFO - Going to convert document batch...
2025-11-14 17:28:54,909 - INFO - Processing document 4_2025-03-07
2025-11-14 17:28:54,938 - INFO - Finished converting document 4_2025-03-07 in 0.06 sec.
2025-11-14 17:28:54,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:54,986 - INFO - Going to convert document batch...
2025-11-14 17:28:54,987 - INFO - Processing document 4_2025-03-11
2025-11-14 17:28:55,008 - INFO - Finished converting document 4_2025-03-11 in 0.03 sec.
2025-11-14 17:28:55,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,066 - INFO - Going to convert document batch...
2025-11-14 17:28:55,067 - INFO - Processing document 4_2025-03-14
2025-11-14 17:28:55,139 - INFO - Finished converting document 4_2025-03-14 in 0.11 sec.


Converted 'data\edgar_documents\PLTR\4_2025-03-07' --> 'data\processed_data\PLTR\4_2025-03-07.md'
Converted 'data\edgar_documents\PLTR\4_2025-03-11' --> 'data\processed_data\PLTR\4_2025-03-11.md'


2025-11-14 17:28:55,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,220 - INFO - Going to convert document batch...
2025-11-14 17:28:55,221 - INFO - Processing document 4_2025-03-19
2025-11-14 17:28:55,259 - INFO - Finished converting document 4_2025-03-19 in 0.06 sec.
2025-11-14 17:28:55,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,312 - INFO - Going to convert document batch...
2025-11-14 17:28:55,312 - INFO - Processing document 4_2025-03-26
2025-11-14 17:28:55,330 - INFO - Finished converting document 4_2025-03-26 in 0.03 sec.
2025-11-14 17:28:55,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,372 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2025-03-14' --> 'data\processed_data\PLTR\4_2025-03-14.md'
Converted 'data\edgar_documents\PLTR\4_2025-03-19' --> 'data\processed_data\PLTR\4_2025-03-19.md'
Converted 'data\edgar_documents\PLTR\4_2025-03-26' --> 'data\processed_data\PLTR\4_2025-03-26.md'


2025-11-14 17:28:55,372 - INFO - Processing document 4_2025-03-27
2025-11-14 17:28:55,391 - INFO - Finished converting document 4_2025-03-27 in 0.05 sec.
2025-11-14 17:28:55,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,448 - INFO - Going to convert document batch...
2025-11-14 17:28:55,449 - INFO - Processing document 4_2025-04-02
2025-11-14 17:28:55,501 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.
2025-11-14 17:28:55,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,555 - INFO - Going to convert document batch...
2025-11-14 17:28:55,556 - INFO - Processing document 4_2025-04-03
2025-11-14 17:28:55,579 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.


Converted 'data\edgar_documents\PLTR\4_2025-03-27' --> 'data\processed_data\PLTR\4_2025-03-27.md'
Converted 'data\edgar_documents\PLTR\4_2025-04-02' --> 'data\processed_data\PLTR\4_2025-04-02.md'


2025-11-14 17:28:55,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,622 - INFO - Going to convert document batch...
2025-11-14 17:28:55,623 - INFO - Processing document 4_2025-04-07
2025-11-14 17:28:55,643 - INFO - Finished converting document 4_2025-04-07 in 0.03 sec.
2025-11-14 17:28:55,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,700 - INFO - Going to convert document batch...
2025-11-14 17:28:55,701 - INFO - Processing document 4_2025-04-24
2025-11-14 17:28:55,720 - INFO - Finished converting document 4_2025-04-24 in 0.06 sec.
2025-11-14 17:28:55,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,783 - INFO - Going to convert document batch...
2025-11-14 17:28:55,784 - INFO - Processing document 4_2025-05-05


Converted 'data\edgar_documents\PLTR\4_2025-04-03' --> 'data\processed_data\PLTR\4_2025-04-03.md'
Converted 'data\edgar_documents\PLTR\4_2025-04-07' --> 'data\processed_data\PLTR\4_2025-04-07.md'
Converted 'data\edgar_documents\PLTR\4_2025-04-24' --> 'data\processed_data\PLTR\4_2025-04-24.md'


2025-11-14 17:28:55,813 - INFO - Finished converting document 4_2025-05-05 in 0.08 sec.
2025-11-14 17:28:55,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,860 - INFO - Going to convert document batch...
2025-11-14 17:28:55,861 - INFO - Processing document 4_2025-05-12
2025-11-14 17:28:55,884 - INFO - Finished converting document 4_2025-05-12 in 0.03 sec.
2025-11-14 17:28:55,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:55,932 - INFO - Going to convert document batch...
2025-11-14 17:28:55,933 - INFO - Processing document 4_2025-05-14
2025-11-14 17:28:55,955 - INFO - Finished converting document 4_2025-05-14 in 0.05 sec.
2025-11-14 17:28:55,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,009 - INFO - Going to convert document batch...
2025-11-14 17:28:56,009 - INFO - Processing document 4_2025-05-22


Converted 'data\edgar_documents\PLTR\4_2025-05-05' --> 'data\processed_data\PLTR\4_2025-05-05.md'
Converted 'data\edgar_documents\PLTR\4_2025-05-12' --> 'data\processed_data\PLTR\4_2025-05-12.md'
Converted 'data\edgar_documents\PLTR\4_2025-05-14' --> 'data\processed_data\PLTR\4_2025-05-14.md'


2025-11-14 17:28:56,038 - INFO - Finished converting document 4_2025-05-22 in 0.05 sec.
2025-11-14 17:28:56,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,098 - INFO - Going to convert document batch...
2025-11-14 17:28:56,098 - INFO - Processing document 4_2025-06-10
2025-11-14 17:28:56,131 - INFO - Finished converting document 4_2025-06-10 in 0.06 sec.
2025-11-14 17:28:56,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,187 - INFO - Going to convert document batch...
2025-11-14 17:28:56,188 - INFO - Processing document 4_2025-06-12
2025-11-14 17:28:56,226 - INFO - Finished converting document 4_2025-06-12 in 0.06 sec.


Converted 'data\edgar_documents\PLTR\4_2025-05-22' --> 'data\processed_data\PLTR\4_2025-05-22.md'
Converted 'data\edgar_documents\PLTR\4_2025-06-10' --> 'data\processed_data\PLTR\4_2025-06-10.md'


2025-11-14 17:28:56,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,280 - INFO - Going to convert document batch...
2025-11-14 17:28:56,281 - INFO - Processing document 4_2025-06-16
2025-11-14 17:28:56,302 - INFO - Finished converting document 4_2025-06-16 in 0.03 sec.
2025-11-14 17:28:56,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,348 - INFO - Going to convert document batch...
2025-11-14 17:28:56,349 - INFO - Processing document 4_2025-06-23
2025-11-14 17:28:56,369 - INFO - Finished converting document 4_2025-06-23 in 0.03 sec.
2025-11-14 17:28:56,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,409 - INFO - Going to convert document batch...
2025-11-14 17:28:56,410 - INFO - Processing document 4_2025-06-24
2025-11-14 17:28:56,428 - INFO - Finished converting document 4_2025-06-24 in 0.03 sec.
2025-11-14 17:28:56,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2025-06-12' --> 'data\processed_data\PLTR\4_2025-06-12.md'
Converted 'data\edgar_documents\PLTR\4_2025-06-16' --> 'data\processed_data\PLTR\4_2025-06-16.md'
Converted 'data\edgar_documents\PLTR\4_2025-06-23' --> 'data\processed_data\PLTR\4_2025-06-23.md'
Converted 'data\edgar_documents\PLTR\4_2025-06-24' --> 'data\processed_data\PLTR\4_2025-06-24.md'


2025-11-14 17:28:56,493 - INFO - Going to convert document batch...
2025-11-14 17:28:56,494 - INFO - Processing document 4_2025-07-03
2025-11-14 17:28:56,524 - INFO - Finished converting document 4_2025-07-03 in 0.06 sec.
2025-11-14 17:28:56,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,602 - INFO - Going to convert document batch...
2025-11-14 17:28:56,603 - INFO - Processing document 4_2025-07-11
2025-11-14 17:28:56,624 - INFO - Finished converting document 4_2025-07-11 in 0.05 sec.
2025-11-14 17:28:56,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,668 - INFO - Going to convert document batch...
2025-11-14 17:28:56,669 - INFO - Processing document 4_2025-07-17
2025-11-14 17:28:56,691 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 17:28:56,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,737 - INFO - Going to convert document batch...
2025-11-14 17:28:56,738 - 

Converted 'data\edgar_documents\PLTR\4_2025-07-03' --> 'data\processed_data\PLTR\4_2025-07-03.md'
Converted 'data\edgar_documents\PLTR\4_2025-07-11' --> 'data\processed_data\PLTR\4_2025-07-11.md'
Converted 'data\edgar_documents\PLTR\4_2025-07-17' --> 'data\processed_data\PLTR\4_2025-07-17.md'


2025-11-14 17:28:56,768 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 17:28:56,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,819 - INFO - Going to convert document batch...
2025-11-14 17:28:56,820 - INFO - Processing document 4_2025-08-07
2025-11-14 17:28:56,847 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.
2025-11-14 17:28:56,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:56,900 - INFO - Going to convert document batch...
2025-11-14 17:28:56,901 - INFO - Processing document 4_2025-08-22
2025-11-14 17:28:56,950 - INFO - Finished converting document 4_2025-08-22 in 0.08 sec.


Converted 'data\edgar_documents\PLTR\4_2025-08-05' --> 'data\processed_data\PLTR\4_2025-08-05.md'
Converted 'data\edgar_documents\PLTR\4_2025-08-07' --> 'data\processed_data\PLTR\4_2025-08-07.md'
Converted 'data\edgar_documents\PLTR\4_2025-08-22' --> 'data\processed_data\PLTR\4_2025-08-22.md'


2025-11-14 17:28:57,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,027 - INFO - Going to convert document batch...
2025-11-14 17:28:57,027 - INFO - Processing document 4_2025-09-03
2025-11-14 17:28:57,046 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.
2025-11-14 17:28:57,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,104 - INFO - Going to convert document batch...
2025-11-14 17:28:57,105 - INFO - Processing document 4_2025-09-04
2025-11-14 17:28:57,144 - INFO - Finished converting document 4_2025-09-04 in 0.08 sec.
2025-11-14 17:28:57,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,194 - INFO - Going to convert document batch...
2025-11-14 17:28:57,194 - INFO - Processing document 4_2025-09-08
2025-11-14 17:28:57,213 - INFO - Finished converting document 4_2025-09-08 in 0.03 sec.
2025-11-14 17:28:57,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\4_2025-09-03' --> 'data\processed_data\PLTR\4_2025-09-03.md'
Converted 'data\edgar_documents\PLTR\4_2025-09-04' --> 'data\processed_data\PLTR\4_2025-09-04.md'
Converted 'data\edgar_documents\PLTR\4_2025-09-08' --> 'data\processed_data\PLTR\4_2025-09-08.md'


2025-11-14 17:28:57,253 - INFO - Going to convert document batch...
2025-11-14 17:28:57,254 - INFO - Processing document 4_2025-09-09
2025-11-14 17:28:57,272 - INFO - Finished converting document 4_2025-09-09 in 0.03 sec.
2025-11-14 17:28:57,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,319 - INFO - Going to convert document batch...
2025-11-14 17:28:57,320 - INFO - Processing document 4_2025-09-15
2025-11-14 17:28:57,346 - INFO - Finished converting document 4_2025-09-15 in 0.05 sec.
2025-11-14 17:28:57,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,411 - INFO - Going to convert document batch...
2025-11-14 17:28:57,412 - INFO - Processing document 4_2025-09-22
2025-11-14 17:28:57,432 - INFO - Finished converting document 4_2025-09-22 in 0.06 sec.
2025-11-14 17:28:57,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,472 - INFO - Going to convert document batch...
2025-11-14 17:28:57,472 - 

Converted 'data\edgar_documents\PLTR\4_2025-09-09' --> 'data\processed_data\PLTR\4_2025-09-09.md'
Converted 'data\edgar_documents\PLTR\4_2025-09-15' --> 'data\processed_data\PLTR\4_2025-09-15.md'
Converted 'data\edgar_documents\PLTR\4_2025-09-22' --> 'data\processed_data\PLTR\4_2025-09-22.md'


2025-11-14 17:28:57,490 - INFO - Finished converting document 4_2025-09-23 in 0.03 sec.
2025-11-14 17:28:57,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,534 - INFO - Going to convert document batch...
2025-11-14 17:28:57,535 - INFO - Processing document 4_2025-10-03


Converted 'data\edgar_documents\PLTR\4_2025-09-23' --> 'data\processed_data\PLTR\4_2025-09-23.md'


2025-11-14 17:28:57,794 - INFO - Finished converting document 4_2025-10-03 in 0.28 sec.
2025-11-14 17:28:57,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,849 - INFO - Going to convert document batch...
2025-11-14 17:28:57,850 - INFO - Processing document 4_2025-10-07
2025-11-14 17:28:57,871 - INFO - Finished converting document 4_2025-10-07 in 0.05 sec.
2025-11-14 17:28:57,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:57,916 - INFO - Going to convert document batch...
2025-11-14 17:28:57,917 - INFO - Processing document 4_2025-11-05
2025-11-14 17:28:57,943 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 17:28:58,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,017 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\4_2025-10-03' --> 'data\processed_data\PLTR\4_2025-10-03.md'
Converted 'data\edgar_documents\PLTR\4_2025-10-07' --> 'data\processed_data\PLTR\4_2025-10-07.md'
Converted 'data\edgar_documents\PLTR\4_2025-11-05' --> 'data\processed_data\PLTR\4_2025-11-05.md'


2025-11-14 17:28:58,018 - INFO - Processing document 8-K_2023-02-02
2025-11-14 17:28:58,029 - INFO - Finished converting document 8-K_2023-02-02 in 0.06 sec.
2025-11-14 17:28:58,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,078 - INFO - Going to convert document batch...
2025-11-14 17:28:58,079 - INFO - Processing document 8-K_2023-02-13
2025-11-14 17:28:58,098 - INFO - Finished converting document 8-K_2023-02-13 in 0.06 sec.
2025-11-14 17:28:58,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,133 - INFO - Going to convert document batch...
2025-11-14 17:28:58,134 - INFO - Processing document 8-K_2023-05-08
2025-11-14 17:28:58,153 - INFO - Finished converting document 8-K_2023-05-08 in 0.05 sec.
2025-11-14 17:28:58,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,193 - INFO - Going to convert document batch...
2025-11-14 17:28:58,194 - INFO - Processing document 8-K_2023-06-09
2025-11-14 17:

Converted 'data\edgar_documents\PLTR\8-K_2023-02-02' --> 'data\processed_data\PLTR\8-K_2023-02-02.md'
Converted 'data\edgar_documents\PLTR\8-K_2023-02-13' --> 'data\processed_data\PLTR\8-K_2023-02-13.md'
Converted 'data\edgar_documents\PLTR\8-K_2023-05-08' --> 'data\processed_data\PLTR\8-K_2023-05-08.md'


2025-11-14 17:28:58,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,254 - INFO - Going to convert document batch...
2025-11-14 17:28:58,255 - INFO - Processing document 8-K_2023-08-07
2025-11-14 17:28:58,280 - INFO - Finished converting document 8-K_2023-08-07 in 0.05 sec.
2025-11-14 17:28:58,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,339 - INFO - Going to convert document batch...
2025-11-14 17:28:58,340 - INFO - Processing document 8-K_2023-11-02
2025-11-14 17:28:58,359 - INFO - Finished converting document 8-K_2023-11-02 in 0.06 sec.
2025-11-14 17:28:58,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,392 - INFO - Going to convert document batch...
2025-11-14 17:28:58,394 - INFO - Processing document 8-K_2024-02-05
2025-11-14 17:28:58,413 - INFO - Finished converting document 8-K_2024-02-05 in 0.05 sec.
2025-11-14 17:28:58,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\8-K_2023-06-09' --> 'data\processed_data\PLTR\8-K_2023-06-09.md'
Converted 'data\edgar_documents\PLTR\8-K_2023-08-07' --> 'data\processed_data\PLTR\8-K_2023-08-07.md'
Converted 'data\edgar_documents\PLTR\8-K_2023-11-02' --> 'data\processed_data\PLTR\8-K_2023-11-02.md'
Converted 'data\edgar_documents\PLTR\8-K_2024-02-05' --> 'data\processed_data\PLTR\8-K_2024-02-05.md'


2025-11-14 17:28:58,446 - INFO - Going to convert document batch...
2025-11-14 17:28:58,446 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:28:58,464 - INFO - Finished converting document 8-K_2024-05-06 in 0.05 sec.
2025-11-14 17:28:58,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,500 - INFO - Going to convert document batch...
2025-11-14 17:28:58,501 - INFO - Processing document 8-K_2024-06-10
2025-11-14 17:28:58,523 - INFO - Finished converting document 8-K_2024-06-10 in 0.05 sec.
2025-11-14 17:28:58,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,574 - INFO - Going to convert document batch...
2025-11-14 17:28:58,575 - INFO - Processing document 8-K_2024-08-05
2025-11-14 17:28:58,591 - INFO - Finished converting document 8-K_2024-08-05 in 0.06 sec.
2025-11-14 17:28:58,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,625 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PLTR\8-K_2024-05-06' --> 'data\processed_data\PLTR\8-K_2024-05-06.md'
Converted 'data\edgar_documents\PLTR\8-K_2024-06-10' --> 'data\processed_data\PLTR\8-K_2024-06-10.md'
Converted 'data\edgar_documents\PLTR\8-K_2024-08-05' --> 'data\processed_data\PLTR\8-K_2024-08-05.md'


2025-11-14 17:28:58,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,677 - INFO - Going to convert document batch...
2025-11-14 17:28:58,678 - INFO - Processing document 8-K_2024-11-14
2025-11-14 17:28:58,697 - INFO - Finished converting document 8-K_2024-11-14 in 0.03 sec.
2025-11-14 17:28:58,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,748 - INFO - Going to convert document batch...
2025-11-14 17:28:58,749 - INFO - Processing document 8-K_2025-02-03
2025-11-14 17:28:58,783 - INFO - Finished converting document 8-K_2025-02-03 in 0.08 sec.
2025-11-14 17:28:58,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,816 - INFO - Going to convert document batch...
2025-11-14 17:28:58,817 - INFO - Processing document 8-K_2025-02-28
2025-11-14 17:28:58,834 - INFO - Finished converting document 8-K_2025-02-28 in 0.03 sec.


Converted 'data\edgar_documents\PLTR\8-K_2024-11-04' --> 'data\processed_data\PLTR\8-K_2024-11-04.md'
Converted 'data\edgar_documents\PLTR\8-K_2024-11-14' --> 'data\processed_data\PLTR\8-K_2024-11-14.md'
Converted 'data\edgar_documents\PLTR\8-K_2025-02-03' --> 'data\processed_data\PLTR\8-K_2025-02-03.md'


2025-11-14 17:28:58,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,864 - INFO - Going to convert document batch...
2025-11-14 17:28:58,865 - INFO - Processing document 8-K_2025-05-05
2025-11-14 17:28:58,885 - INFO - Finished converting document 8-K_2025-05-05 in 0.05 sec.
2025-11-14 17:28:58,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,922 - INFO - Going to convert document batch...
2025-11-14 17:28:58,923 - INFO - Processing document 8-K_2025-06-09
2025-11-14 17:28:58,947 - INFO - Finished converting document 8-K_2025-06-09 in 0.05 sec.
2025-11-14 17:28:58,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:58,999 - INFO - Going to convert document batch...
2025-11-14 17:28:58,999 - INFO - Processing document 8-K_2025-08-04
2025-11-14 17:28:59,017 - INFO - Finished converting document 8-K_2025-08-04 in 0.06 sec.


Converted 'data\edgar_documents\PLTR\8-K_2025-02-28' --> 'data\processed_data\PLTR\8-K_2025-02-28.md'
Converted 'data\edgar_documents\PLTR\8-K_2025-05-05' --> 'data\processed_data\PLTR\8-K_2025-05-05.md'
Converted 'data\edgar_documents\PLTR\8-K_2025-06-09' --> 'data\processed_data\PLTR\8-K_2025-06-09.md'
Converted 'data\edgar_documents\PLTR\8-K_2025-08-04' --> 'data\processed_data\PLTR\8-K_2025-08-04.md'


2025-11-14 17:28:59,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:28:59,069 - INFO - Going to convert document batch...
2025-11-14 17:28:59,070 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:28:59,089 - INFO - Finished converting document 8-K_2025-11-03 in 0.06 sec.
2025-11-14 17:28:59,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\8-K_2025-11-03' --> 'data\processed_data\PLTR\8-K_2025-11-03.md'


2025-11-14 17:28:59,341 - INFO - Going to convert document batch...
2025-11-14 17:28:59,342 - INFO - Processing document DEF-14A_2023-04-26
2025-11-14 17:28:59,765 - INFO - Finished converting document DEF-14A_2023-04-26 in 0.67 sec.
2025-11-14 17:28:59,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:00,160 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PLTR\DEF-14A_2023-04-26' --> 'data\processed_data\PLTR\DEF-14A_2023-04-26.md'


2025-11-14 17:29:00,161 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 17:29:00,503 - INFO - Finished converting document DEF-14A_2024-04-26 in 0.55 sec.
2025-11-14 17:29:00,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\DEF-14A_2024-04-26' --> 'data\processed_data\PLTR\DEF-14A_2024-04-26.md'


2025-11-14 17:29:01,124 - INFO - Going to convert document batch...
2025-11-14 17:29:01,124 - INFO - Processing document DEF-14A_2025-04-25
2025-11-14 17:29:01,511 - INFO - Finished converting document DEF-14A_2025-04-25 in 0.81 sec.
2025-11-14 17:29:01,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PLTR\DEF-14A_2025-04-25' --> 'data\processed_data\PLTR\DEF-14A_2025-04-25.md'
Processed 201 new files. Errors: 0
Found 133 files to process in data\edgar_documents\PM


2025-11-14 17:29:03,018 - INFO - Going to convert document batch...
2025-11-14 17:29:03,018 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:29:03,019 - INFO - Processing document 10-K_2023-02-10
2025-11-14 17:29:06,868 - INFO - Finished converting document 10-K_2023-02-10 in 5.16 sec.
2025-11-14 17:29:07,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-K_2023-02-10' --> 'data\processed_data\PM\10-K_2023-02-10.md'


2025-11-14 17:29:09,049 - INFO - Going to convert document batch...
2025-11-14 17:29:09,050 - INFO - Processing document 10-K_2024-02-08
2025-11-14 17:29:13,542 - INFO - Finished converting document 10-K_2024-02-08 in 5.81 sec.
2025-11-14 17:29:14,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-K_2024-02-08' --> 'data\processed_data\PM\10-K_2024-02-08.md'


2025-11-14 17:29:15,430 - INFO - Going to convert document batch...
2025-11-14 17:29:15,431 - INFO - Processing document 10-K_2025-02-06
2025-11-14 17:29:19,805 - INFO - Finished converting document 10-K_2025-02-06 in 5.33 sec.
2025-11-14 17:29:20,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-K_2025-02-06' --> 'data\processed_data\PM\10-K_2025-02-06.md'


2025-11-14 17:29:21,282 - INFO - Going to convert document batch...
2025-11-14 17:29:21,283 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 17:29:22,676 - INFO - Finished converting document 10-Q_2023-04-26 in 1.95 sec.
2025-11-14 17:29:23,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2023-04-26' --> 'data\processed_data\PM\10-Q_2023-04-26.md'


2025-11-14 17:29:24,670 - INFO - Going to convert document batch...
2025-11-14 17:29:24,671 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:29:26,610 - INFO - Finished converting document 10-Q_2023-07-27 in 3.26 sec.
2025-11-14 17:29:27,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2023-07-27' --> 'data\processed_data\PM\10-Q_2023-07-27.md'


2025-11-14 17:29:28,603 - INFO - Going to convert document batch...
2025-11-14 17:29:28,604 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:29:30,572 - INFO - Finished converting document 10-Q_2023-10-26 in 3.12 sec.
2025-11-14 17:29:31,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2023-10-26' --> 'data\processed_data\PM\10-Q_2023-10-26.md'


2025-11-14 17:29:32,368 - INFO - Going to convert document batch...
2025-11-14 17:29:32,369 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 17:29:33,638 - INFO - Finished converting document 10-Q_2024-04-26 in 2.23 sec.
2025-11-14 17:29:34,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2024-04-26' --> 'data\processed_data\PM\10-Q_2024-04-26.md'


2025-11-14 17:29:35,361 - INFO - Going to convert document batch...
2025-11-14 17:29:35,361 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:29:37,083 - INFO - Finished converting document 10-Q_2024-07-25 in 2.81 sec.
2025-11-14 17:29:37,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2024-07-25' --> 'data\processed_data\PM\10-Q_2024-07-25.md'


2025-11-14 17:29:38,876 - INFO - Going to convert document batch...
2025-11-14 17:29:38,877 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 17:29:40,583 - INFO - Finished converting document 10-Q_2024-10-24 in 2.78 sec.
2025-11-14 17:29:41,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2024-10-24' --> 'data\processed_data\PM\10-Q_2024-10-24.md'


2025-11-14 17:29:41,809 - INFO - Going to convert document batch...
2025-11-14 17:29:41,810 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:29:42,952 - INFO - Finished converting document 10-Q_2025-04-24 in 1.66 sec.
2025-11-14 17:29:44,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2025-04-24' --> 'data\processed_data\PM\10-Q_2025-04-24.md'


2025-11-14 17:29:44,786 - INFO - Going to convert document batch...
2025-11-14 17:29:44,787 - INFO - Processing document 10-Q_2025-07-25
2025-11-14 17:29:46,679 - INFO - Finished converting document 10-Q_2025-07-25 in 2.62 sec.
2025-11-14 17:29:47,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\10-Q_2025-07-25' --> 'data\processed_data\PM\10-Q_2025-07-25.md'


2025-11-14 17:29:48,170 - INFO - Going to convert document batch...
2025-11-14 17:29:48,171 - INFO - Processing document 10-Q_2025-10-24
2025-11-14 17:29:49,829 - INFO - Finished converting document 10-Q_2025-10-24 in 2.36 sec.
2025-11-14 17:29:51,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,247 - INFO - Going to convert document batch...
2025-11-14 17:29:51,248 - INFO - Processing document 4_2023-01-04
2025-11-14 17:29:51,269 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 17:29:51,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,330 - INFO - Going to convert document batch...
2025-11-14 17:29:51,330 - INFO - Processing document 4_2023-02-10
2025-11-14 17:29:51,350 - INFO - Finished converting document 4_2023-02-10 in 0.05 sec.
2025-11-14 17:29:51,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,389 - INFO - Going to convert document batch...
2025-11-14 17:29:51,

Converted 'data\edgar_documents\PM\10-Q_2025-10-24' --> 'data\processed_data\PM\10-Q_2025-10-24.md'
Converted 'data\edgar_documents\PM\4_2023-01-04' --> 'data\processed_data\PM\4_2023-01-04.md'
Converted 'data\edgar_documents\PM\4_2023-02-10' --> 'data\processed_data\PM\4_2023-02-10.md'


2025-11-14 17:29:51,452 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:51,453 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:51,454 - INFO - Going to convert document batch...
2025-11-14 17:29:51,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,476 - INFO - Going to convert document batch...
2025-11-14 17:29:51,477 - INFO - Processing document 4_2023-02-17
2025-11-14 17:29:51,495 - INFO - Fin

Converted 'data\edgar_documents\PM\4_2023-02-13' --> 'data\processed_data\PM\4_2023-02-13.md'
Error processing data\edgar_documents\PM\4_2023-02-14: File format not allowed: data\edgar_documents\PM\4_2023-02-14
Converted 'data\edgar_documents\PM\4_2023-02-17' --> 'data\processed_data\PM\4_2023-02-17.md'
Converted 'data\edgar_documents\PM\4_2023-02-22' --> 'data\processed_data\PM\4_2023-02-22.md'


2025-11-14 17:29:51,625 - INFO - Processing document 4_2023-03-06
2025-11-14 17:29:51,643 - INFO - Finished converting document 4_2023-03-06 in 0.03 sec.
2025-11-14 17:29:51,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,692 - INFO - Going to convert document batch...
2025-11-14 17:29:51,693 - INFO - Processing document 4_2023-04-04
2025-11-14 17:29:51,720 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 17:29:51,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,767 - INFO - Going to convert document batch...
2025-11-14 17:29:51,767 - INFO - Processing document 4_2023-04-07
2025-11-14 17:29:51,788 - INFO - Finished converting document 4_2023-04-07 in 0.03 sec.
2025-11-14 17:29:51,837 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:51,837 - ERROR - Input document 4_2023-04-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\PM\4_2023-03-06' --> 'data\processed_data\PM\4_2023-03-06.md'
Converted 'data\edgar_documents\PM\4_2023-04-04' --> 'data\processed_data\PM\4_2023-04-04.md'
Converted 'data\edgar_documents\PM\4_2023-04-07' --> 'data\processed_data\PM\4_2023-04-07.md'


2025-11-14 17:29:51,839 - INFO - Going to convert document batch...
2025-11-14 17:29:51,859 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:51,860 - ERROR - Input document 4_2023-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:51,861 - INFO - Going to convert document batch...
2025-11-14 17:29:51,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:51,881 - INFO - Going to convert document batch...
2025-11-14 17:29:51,882 - INFO - P

Error processing data\edgar_documents\PM\4_2023-04-27: File format not allowed: data\edgar_documents\PM\4_2023-04-27
Error processing data\edgar_documents\PM\4_2023-04-28: File format not allowed: data\edgar_documents\PM\4_2023-04-28
Converted 'data\edgar_documents\PM\4_2023-05-05' --> 'data\processed_data\PM\4_2023-05-05.md'
Converted 'data\edgar_documents\PM\4_2023-07-05' --> 'data\processed_data\PM\4_2023-07-05.md'


2025-11-14 17:29:52,045 - ERROR - Input document 4_2023-09-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:52,047 - INFO - Going to convert document batch...
2025-11-14 17:29:52,068 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:52,069 - ERROR - Input document 4_2023-09-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\PM\4_2023-09-05: File format not allowed: data\edgar_documents\PM\4_2023-09-05
Error processing data\edgar_documents\PM\4_2023-09-06: File format not allowed: data\edgar_documents\PM\4_2023-09-06
Converted 'data\edgar_documents\PM\4_2023-10-03' --> 'data\processed_data\PM\4_2023-10-03.md'
Converted 'data\edgar_documents\PM\4_2023-11-30' --> 'data\processed_data\PM\4_2023-11-30.md'


2025-11-14 17:29:52,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:52,285 - INFO - Going to convert document batch...
2025-11-14 17:29:52,287 - INFO - Processing document 4_2024-02-09
2025-11-14 17:29:52,310 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.
2025-11-14 17:29:52,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:52,355 - ERROR - Input document 4_2024-02-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29

Converted 'data\edgar_documents\PM\4_2024-01-03' --> 'data\processed_data\PM\4_2024-01-03.md'
Converted 'data\edgar_documents\PM\4_2024-02-09' --> 'data\processed_data\PM\4_2024-02-09.md'
Error processing data\edgar_documents\PM\4_2024-02-12: File format not allowed: data\edgar_documents\PM\4_2024-02-12
Converted 'data\edgar_documents\PM\4_2024-02-23' --> 'data\processed_data\PM\4_2024-02-23.md'


2025-11-14 17:29:52,464 - INFO - Going to convert document batch...
2025-11-14 17:29:52,464 - INFO - Processing document 4_2024-03-11
2025-11-14 17:29:52,483 - INFO - Finished converting document 4_2024-03-11 in 0.05 sec.
2025-11-14 17:29:52,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:52,532 - INFO - Going to convert document batch...
2025-11-14 17:29:52,533 - INFO - Processing document 4_2024-03-19
2025-11-14 17:29:52,553 - INFO - Finished converting document 4_2024-03-19 in 0.03 sec.
2025-11-14 17:29:52,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:52,597 - INFO - Going to convert document batch...
2025-11-14 17:29:52,598 - INFO - Processing document 4_2024-04-02
2025-11-14 17:29:52,619 - INFO - Finished converting document 4_2024-04-02 in 0.03 sec.
2025-11-14 17:29:52,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:52,660 - INFO - Going to convert document batch...
2025-11-14 17:29:52,661 - 

Converted 'data\edgar_documents\PM\4_2024-03-11' --> 'data\processed_data\PM\4_2024-03-11.md'
Converted 'data\edgar_documents\PM\4_2024-03-19' --> 'data\processed_data\PM\4_2024-03-19.md'
Converted 'data\edgar_documents\PM\4_2024-04-02' --> 'data\processed_data\PM\4_2024-04-02.md'
Converted 'data\edgar_documents\PM\4_2024-04-26' --> 'data\processed_data\PM\4_2024-04-26.md'


2025-11-14 17:29:52,720 - INFO - Going to convert document batch...
2025-11-14 17:29:52,721 - INFO - Processing document 4_2024-05-10
2025-11-14 17:29:52,739 - INFO - Finished converting document 4_2024-05-10 in 0.03 sec.
2025-11-14 17:29:52,780 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:52,781 - ERROR - Input document 4_2024-06-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:52,782 - INFO - Going to convert document batch...
2025-11-14 17:29:52,803 - IN

Converted 'data\edgar_documents\PM\4_2024-05-10' --> 'data\processed_data\PM\4_2024-05-10.md'
Error processing data\edgar_documents\PM\4_2024-06-03: File format not allowed: data\edgar_documents\PM\4_2024-06-03
Error processing data\edgar_documents\PM\4_2024-06-04: File format not allowed: data\edgar_documents\PM\4_2024-06-04
Converted 'data\edgar_documents\PM\4_2024-07-29' --> 'data\processed_data\PM\4_2024-07-29.md'
Converted 'data\edgar_documents\PM\4_2024-08-12' --> 'data\processed_data\PM\4_2024-08-12.md'


2025-11-14 17:29:52,970 - INFO - Going to convert document batch...
2025-11-14 17:29:52,971 - INFO - Processing document 4_2024-08-23
2025-11-14 17:29:52,990 - INFO - Finished converting document 4_2024-08-23 in 0.03 sec.
2025-11-14 17:29:53,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,044 - INFO - Going to convert document batch...
2025-11-14 17:29:53,045 - INFO - Processing document 4_2024-10-25
2025-11-14 17:29:53,064 - INFO - Finished converting document 4_2024-10-25 in 0.05 sec.
2025-11-14 17:29:53,135 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:53,136 - ERROR - Input document 4_2024-10-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\PM\4_2024-08-23' --> 'data\processed_data\PM\4_2024-08-23.md'
Converted 'data\edgar_documents\PM\4_2024-10-25' --> 'data\processed_data\PM\4_2024-10-25.md'
Error processing data\edgar_documents\PM\4_2024-10-30: File format not allowed: data\edgar_documents\PM\4_2024-10-30
Error processing data\edgar_documents\PM\4_2024-10-31: File format not allowed: data\edgar_documents\PM\4_2024-10-31


2025-11-14 17:29:53,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,239 - INFO - Going to convert document batch...
2025-11-14 17:29:53,240 - INFO - Processing document 4_2024-11-08
2025-11-14 17:29:53,261 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 17:29:53,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,309 - INFO - Going to convert document batch...
2025-11-14 17:29:53,309 - INFO - Processing document 4_2025-02-07
2025-11-14 17:29:53,330 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 17:29:53,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,372 - INFO - Going to convert document batch...
2025-11-14 17:29:53,373 - INFO - Processing document 4_2025-02-13
2025-11-14 17:29:53,393 - INFO - Finished converting document 4_2025-02-13 in 0.05 sec.


Converted 'data\edgar_documents\PM\4_2024-11-01' --> 'data\processed_data\PM\4_2024-11-01.md'
Converted 'data\edgar_documents\PM\4_2024-11-08' --> 'data\processed_data\PM\4_2024-11-08.md'
Converted 'data\edgar_documents\PM\4_2025-02-07' --> 'data\processed_data\PM\4_2025-02-07.md'


2025-11-14 17:29:53,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,433 - INFO - Going to convert document batch...
2025-11-14 17:29:53,434 - INFO - Processing document 4_2025-02-21
2025-11-14 17:29:53,455 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 17:29:53,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,511 - INFO - Going to convert document batch...
2025-11-14 17:29:53,513 - INFO - Processing document 4_2025-02-25
2025-11-14 17:29:53,544 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 17:29:53,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,588 - INFO - Going to convert document batch...
2025-11-14 17:29:53,589 - INFO - Processing document 4_2025-03-07


Converted 'data\edgar_documents\PM\4_2025-02-13' --> 'data\processed_data\PM\4_2025-02-13.md'
Converted 'data\edgar_documents\PM\4_2025-02-21' --> 'data\processed_data\PM\4_2025-02-21.md'
Converted 'data\edgar_documents\PM\4_2025-02-25' --> 'data\processed_data\PM\4_2025-02-25.md'


2025-11-14 17:29:53,607 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 17:29:53,651 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:53,651 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:53,652 - INFO - Going to convert document batch...
2025-11-14 17:29:53,676 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:29:53,676 - ERROR - Input document 4_2025-04-29 with forma

Converted 'data\edgar_documents\PM\4_2025-03-07' --> 'data\processed_data\PM\4_2025-03-07.md'
Error processing data\edgar_documents\PM\4_2025-04-28: File format not allowed: data\edgar_documents\PM\4_2025-04-28
Error processing data\edgar_documents\PM\4_2025-04-29: File format not allowed: data\edgar_documents\PM\4_2025-04-29
Converted 'data\edgar_documents\PM\4_2025-05-09' --> 'data\processed_data\PM\4_2025-05-09.md'
Error processing data\edgar_documents\PM\4_2025-06-03: File format not allowed: data\edgar_documents\PM\4_2025-06-03
Error processing data\edgar_documents\PM\4_2025-06-04: File format not allowed: data\edgar_documents\PM\4_2025-06-04
Error processing data\edgar_documents\PM\4_2025-10-27: File format not allowed: data\edgar_documents\PM\4_2025-10-27


2025-11-14 17:29:53,828 - ERROR - Input document 4_2025-10-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:29:53,829 - INFO - Going to convert document batch...
2025-11-14 17:29:53,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:53,878 - INFO - Going to convert document batch...
2025-11-14 17:29:53,879 - INFO - Processing document 8-K_2023-01-11
2025-11-14 17:29:53,921 - INFO - Finished converting document 8-K_2023-01-11 in 0.09 sec.
2025-11-14 17:29:53,953 - INFO - d

Error processing data\edgar_documents\PM\4_2025-10-28: File format not allowed: data\edgar_documents\PM\4_2025-10-28
Converted 'data\edgar_documents\PM\8-K_2023-01-11' --> 'data\processed_data\PM\8-K_2023-01-11.md'


2025-11-14 17:29:54,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,082 - INFO - Going to convert document batch...
2025-11-14 17:29:54,083 - INFO - Processing document 8-K_2023-02-09
2025-11-14 17:29:54,133 - INFO - Finished converting document 8-K_2023-02-09 in 0.09 sec.
2025-11-14 17:29:54,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,204 - INFO - Going to convert document batch...
2025-11-14 17:29:54,205 - INFO - Processing document 8-K_2023-02-17


Converted 'data\edgar_documents\PM\8-K_2023-01-30' --> 'data\processed_data\PM\8-K_2023-01-30.md'
Converted 'data\edgar_documents\PM\8-K_2023-02-09' --> 'data\processed_data\PM\8-K_2023-02-09.md'


2025-11-14 17:29:54,240 - INFO - Finished converting document 8-K_2023-02-17 in 0.08 sec.
2025-11-14 17:29:54,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,304 - INFO - Going to convert document batch...
2025-11-14 17:29:54,305 - INFO - Processing document 8-K_2023-02-22
2025-11-14 17:29:54,348 - INFO - Finished converting document 8-K_2023-02-22 in 0.09 sec.
2025-11-14 17:29:54,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,410 - INFO - Going to convert document batch...
2025-11-14 17:29:54,411 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:29:54,452 - INFO - Finished converting document 8-K_2023-03-03 in 0.09 sec.


Converted 'data\edgar_documents\PM\8-K_2023-02-17' --> 'data\processed_data\PM\8-K_2023-02-17.md'
Converted 'data\edgar_documents\PM\8-K_2023-02-22' --> 'data\processed_data\PM\8-K_2023-02-22.md'


2025-11-14 17:29:54,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,538 - INFO - Going to convert document batch...
2025-11-14 17:29:54,539 - INFO - Processing document 8-K_2023-03-09
2025-11-14 17:29:54,585 - INFO - Finished converting document 8-K_2023-03-09 in 0.11 sec.
2025-11-14 17:29:54,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,652 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PM\8-K_2023-03-03' --> 'data\processed_data\PM\8-K_2023-03-03.md'
Converted 'data\edgar_documents\PM\8-K_2023-03-09' --> 'data\processed_data\PM\8-K_2023-03-09.md'


2025-11-14 17:29:54,654 - INFO - Processing document 8-K_2023-03-28
2025-11-14 17:29:54,698 - INFO - Finished converting document 8-K_2023-03-28 in 0.11 sec.
2025-11-14 17:29:54,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,763 - INFO - Going to convert document batch...
2025-11-14 17:29:54,764 - INFO - Processing document 8-K_2023-04-20
2025-11-14 17:29:54,803 - INFO - Finished converting document 8-K_2023-04-20 in 0.08 sec.
2025-11-14 17:29:54,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:54,864 - INFO - Going to convert document batch...
2025-11-14 17:29:54,864 - INFO - Processing document 8-K_2023-05-01


Converted 'data\edgar_documents\PM\8-K_2023-03-28' --> 'data\processed_data\PM\8-K_2023-03-28.md'
Converted 'data\edgar_documents\PM\8-K_2023-04-20' --> 'data\processed_data\PM\8-K_2023-04-20.md'


2025-11-14 17:29:54,933 - INFO - Finished converting document 8-K_2023-05-01 in 0.12 sec.
2025-11-14 17:29:54,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:55,038 - INFO - Going to convert document batch...
2025-11-14 17:29:55,039 - INFO - Processing document 8-K_2023-05-03
2025-11-14 17:29:55,077 - INFO - Finished converting document 8-K_2023-05-03 in 0.09 sec.
2025-11-14 17:29:55,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:55,147 - INFO - Going to convert document batch...
2025-11-14 17:29:55,148 - INFO - Processing document 8-K_2023-05-09


Converted 'data\edgar_documents\PM\8-K_2023-05-01' --> 'data\processed_data\PM\8-K_2023-05-01.md'
Converted 'data\edgar_documents\PM\8-K_2023-05-03' --> 'data\processed_data\PM\8-K_2023-05-03.md'


2025-11-14 17:29:55,206 - INFO - Finished converting document 8-K_2023-05-09 in 0.11 sec.
2025-11-14 17:29:55,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:55,281 - INFO - Going to convert document batch...
2025-11-14 17:29:55,282 - INFO - Processing document 8-K_2023-05-23
2025-11-14 17:29:55,321 - INFO - Finished converting document 8-K_2023-05-23 in 0.08 sec.
2025-11-14 17:29:55,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:55,379 - INFO - Going to convert document batch...
2025-11-14 17:29:55,379 - INFO - Processing document 8-K_2023-06-06
2025-11-14 17:29:55,415 - INFO - Finished converting document 8-K_2023-06-06 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2023-05-09' --> 'data\processed_data\PM\8-K_2023-05-09.md'
Converted 'data\edgar_documents\PM\8-K_2023-05-23' --> 'data\processed_data\PM\8-K_2023-05-23.md'


2025-11-14 17:29:55,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:55,474 - INFO - Going to convert document batch...
2025-11-14 17:29:55,475 - INFO - Processing document 8-K_2023-06-09
2025-11-14 17:29:55,539 - INFO - Finished converting document 8-K_2023-06-09 in 0.09 sec.
2025-11-14 17:29:55,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\8-K_2023-06-06' --> 'data\processed_data\PM\8-K_2023-06-06.md'
Converted 'data\edgar_documents\PM\8-K_2023-06-09' --> 'data\processed_data\PM\8-K_2023-06-09.md'


2025-11-14 17:29:56,058 - INFO - Going to convert document batch...
2025-11-14 17:29:56,059 - INFO - Processing document 8-K_2023-07-20
2025-11-14 17:29:56,094 - INFO - Finished converting document 8-K_2023-07-20 in 0.53 sec.
2025-11-14 17:29:56,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,159 - INFO - Going to convert document batch...
2025-11-14 17:29:56,159 - INFO - Processing document 8-K_2023-07-28
2025-11-14 17:29:56,198 - INFO - Finished converting document 8-K_2023-07-28 in 0.09 sec.
2025-11-14 17:29:56,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,286 - INFO - Going to convert document batch...
2025-11-14 17:29:56,286 - INFO - Processing document 8-K_2023-09-07


Converted 'data\edgar_documents\PM\8-K_2023-07-20' --> 'data\processed_data\PM\8-K_2023-07-20.md'
Converted 'data\edgar_documents\PM\8-K_2023-07-28' --> 'data\processed_data\PM\8-K_2023-07-28.md'


2025-11-14 17:29:56,342 - INFO - Finished converting document 8-K_2023-09-07 in 0.12 sec.
2025-11-14 17:29:56,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,418 - INFO - Going to convert document batch...
2025-11-14 17:29:56,420 - INFO - Processing document 8-K_2023-09-13
2025-11-14 17:29:56,489 - INFO - Finished converting document 8-K_2023-09-13 in 0.11 sec.
2025-11-14 17:29:56,543 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\8-K_2023-09-07' --> 'data\processed_data\PM\8-K_2023-09-07.md'
Converted 'data\edgar_documents\PM\8-K_2023-09-13' --> 'data\processed_data\PM\8-K_2023-09-13.md'


2025-11-14 17:29:56,571 - INFO - Going to convert document batch...
2025-11-14 17:29:56,572 - INFO - Processing document 8-K_2023-09-18
2025-11-14 17:29:56,611 - INFO - Finished converting document 8-K_2023-09-18 in 0.09 sec.
2025-11-14 17:29:56,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,679 - INFO - Going to convert document batch...
2025-11-14 17:29:56,679 - INFO - Processing document 8-K_2023-09-20
2025-11-14 17:29:56,726 - INFO - Finished converting document 8-K_2023-09-20 in 0.09 sec.
2025-11-14 17:29:56,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,796 - INFO - Going to convert document batch...
2025-11-14 17:29:56,797 - INFO - Processing document 8-K_2023-09-28


Converted 'data\edgar_documents\PM\8-K_2023-09-18' --> 'data\processed_data\PM\8-K_2023-09-18.md'
Converted 'data\edgar_documents\PM\8-K_2023-09-20' --> 'data\processed_data\PM\8-K_2023-09-20.md'


2025-11-14 17:29:56,838 - INFO - Finished converting document 8-K_2023-09-28 in 0.08 sec.
2025-11-14 17:29:56,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:56,899 - INFO - Going to convert document batch...
2025-11-14 17:29:56,900 - INFO - Processing document 8-K_2023-10-19
2025-11-14 17:29:56,944 - INFO - Finished converting document 8-K_2023-10-19 in 0.08 sec.
2025-11-14 17:29:57,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,036 - INFO - Going to convert document batch...
2025-11-14 17:29:57,037 - INFO - Processing document 8-K_2023-12-07


Converted 'data\edgar_documents\PM\8-K_2023-09-28' --> 'data\processed_data\PM\8-K_2023-09-28.md'
Converted 'data\edgar_documents\PM\8-K_2023-10-19' --> 'data\processed_data\PM\8-K_2023-10-19.md'


2025-11-14 17:29:57,073 - INFO - Finished converting document 8-K_2023-12-07 in 0.11 sec.
2025-11-14 17:29:57,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,135 - INFO - Going to convert document batch...
2025-11-14 17:29:57,136 - INFO - Processing document 8-K_2023-12-08
2025-11-14 17:29:57,175 - INFO - Finished converting document 8-K_2023-12-08 in 0.08 sec.
2025-11-14 17:29:57,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,233 - INFO - Going to convert document batch...
2025-11-14 17:29:57,234 - INFO - Processing document 8-K_2024-01-24
2025-11-14 17:29:57,281 - INFO - Finished converting document 8-K_2024-01-24 in 0.09 sec.


Converted 'data\edgar_documents\PM\8-K_2023-12-07' --> 'data\processed_data\PM\8-K_2023-12-07.md'
Converted 'data\edgar_documents\PM\8-K_2023-12-08' --> 'data\processed_data\PM\8-K_2023-12-08.md'


2025-11-14 17:29:57,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,387 - INFO - Going to convert document batch...
2025-11-14 17:29:57,388 - INFO - Processing document 8-K_2024-02-02
2025-11-14 17:29:57,433 - INFO - Finished converting document 8-K_2024-02-02 in 0.11 sec.
2025-11-14 17:29:57,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,494 - INFO - Going to convert document batch...
2025-11-14 17:29:57,495 - INFO - Processing document 8-K_2024-02-08


Converted 'data\edgar_documents\PM\8-K_2024-01-24' --> 'data\processed_data\PM\8-K_2024-01-24.md'
Converted 'data\edgar_documents\PM\8-K_2024-02-02' --> 'data\processed_data\PM\8-K_2024-02-02.md'


2025-11-14 17:29:57,535 - INFO - Finished converting document 8-K_2024-02-08 in 0.08 sec.
2025-11-14 17:29:57,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,597 - INFO - Going to convert document batch...
2025-11-14 17:29:57,598 - INFO - Processing document 8-K_2024-02-13
2025-11-14 17:29:57,662 - INFO - Finished converting document 8-K_2024-02-13 in 0.11 sec.
2025-11-14 17:29:57,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,732 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PM\8-K_2024-02-08' --> 'data\processed_data\PM\8-K_2024-02-08.md'
Converted 'data\edgar_documents\PM\8-K_2024-02-13' --> 'data\processed_data\PM\8-K_2024-02-13.md'


2025-11-14 17:29:57,733 - INFO - Processing document 8-K_2024-02-21
2025-11-14 17:29:57,773 - INFO - Finished converting document 8-K_2024-02-21 in 0.08 sec.
2025-11-14 17:29:57,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,858 - INFO - Going to convert document batch...
2025-11-14 17:29:57,859 - INFO - Processing document 8-K_2024-02-27
2025-11-14 17:29:57,899 - INFO - Finished converting document 8-K_2024-02-27 in 0.09 sec.
2025-11-14 17:29:57,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:57,952 - INFO - Going to convert document batch...
2025-11-14 17:29:57,953 - INFO - Processing document 8-K_2024-03-07
2025-11-14 17:29:57,990 - INFO - Finished converting document 8-K_2024-03-07 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2024-02-21' --> 'data\processed_data\PM\8-K_2024-02-21.md'
Converted 'data\edgar_documents\PM\8-K_2024-02-27' --> 'data\processed_data\PM\8-K_2024-02-27.md'


2025-11-14 17:29:58,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,042 - INFO - Going to convert document batch...
2025-11-14 17:29:58,043 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:29:58,083 - INFO - Finished converting document 8-K_2024-04-23 in 0.08 sec.
2025-11-14 17:29:58,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,140 - INFO - Going to convert document batch...
2025-11-14 17:29:58,141 - INFO - Processing document 8-K_2024-05-08
2025-11-14 17:29:58,177 - INFO - Finished converting document 8-K_2024-05-08 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2024-03-07' --> 'data\processed_data\PM\8-K_2024-03-07.md'
Converted 'data\edgar_documents\PM\8-K_2024-04-23' --> 'data\processed_data\PM\8-K_2024-04-23.md'


2025-11-14 17:29:58,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,232 - INFO - Going to convert document batch...
2025-11-14 17:29:58,237 - INFO - Processing document 8-K_2024-05-09
2025-11-14 17:29:58,308 - INFO - Finished converting document 8-K_2024-05-09 in 0.12 sec.
2025-11-14 17:29:58,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,366 - INFO - Going to convert document batch...
2025-11-14 17:29:58,367 - INFO - Processing document 8-K_2024-06-04


Converted 'data\edgar_documents\PM\8-K_2024-05-08' --> 'data\processed_data\PM\8-K_2024-05-08.md'
Converted 'data\edgar_documents\PM\8-K_2024-05-09' --> 'data\processed_data\PM\8-K_2024-05-09.md'


2025-11-14 17:29:58,402 - INFO - Finished converting document 8-K_2024-06-04 in 0.08 sec.
2025-11-14 17:29:58,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,471 - INFO - Going to convert document batch...
2025-11-14 17:29:58,472 - INFO - Processing document 8-K_2024-06-06


Converted 'data\edgar_documents\PM\8-K_2024-06-04' --> 'data\processed_data\PM\8-K_2024-06-04.md'


2025-11-14 17:29:58,744 - INFO - Finished converting document 8-K_2024-06-06 in 0.33 sec.
2025-11-14 17:29:58,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,839 - INFO - Going to convert document batch...
2025-11-14 17:29:58,840 - INFO - Processing document 8-K_2024-06-07
2025-11-14 17:29:58,887 - INFO - Finished converting document 8-K_2024-06-07 in 0.12 sec.
2025-11-14 17:29:58,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:58,939 - INFO - Going to convert document batch...
2025-11-14 17:29:58,940 - INFO - Processing document 8-K_2024-06-17


Converted 'data\edgar_documents\PM\8-K_2024-06-06' --> 'data\processed_data\PM\8-K_2024-06-06.md'
Converted 'data\edgar_documents\PM\8-K_2024-06-07' --> 'data\processed_data\PM\8-K_2024-06-07.md'


2025-11-14 17:29:58,977 - INFO - Finished converting document 8-K_2024-06-17 in 0.06 sec.
2025-11-14 17:29:59,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,030 - INFO - Going to convert document batch...
2025-11-14 17:29:59,031 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:29:59,071 - INFO - Finished converting document 8-K_2024-07-23 in 0.08 sec.
2025-11-14 17:29:59,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,124 - INFO - Going to convert document batch...
2025-11-14 17:29:59,125 - INFO - Processing document 8-K_2024-09-03
2025-11-14 17:29:59,160 - INFO - Finished converting document 8-K_2024-09-03 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2024-06-17' --> 'data\processed_data\PM\8-K_2024-06-17.md'
Converted 'data\edgar_documents\PM\8-K_2024-07-23' --> 'data\processed_data\PM\8-K_2024-07-23.md'
Converted 'data\edgar_documents\PM\8-K_2024-09-03' --> 'data\processed_data\PM\8-K_2024-09-03.md'


2025-11-14 17:29:59,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,227 - INFO - Going to convert document batch...
2025-11-14 17:29:59,229 - INFO - Processing document 8-K_2024-09-12
2025-11-14 17:29:59,268 - INFO - Finished converting document 8-K_2024-09-12 in 0.09 sec.
2025-11-14 17:29:59,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,342 - INFO - Going to convert document batch...
2025-11-14 17:29:59,342 - INFO - Processing document 8-K_2024-09-17
2025-11-14 17:29:59,380 - INFO - Finished converting document 8-K_2024-09-17 in 0.09 sec.
2025-11-14 17:29:59,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,432 - INFO - Going to convert document batch...
2025-11-14 17:29:59,433 - INFO - Processing document 8-K_2024-10-18
2025-11-14 17:29:59,471 - INFO - Finished converting document 8-K_2024-10-18 in 0.08 sec.


Converted 'data\edgar_documents\PM\8-K_2024-09-12' --> 'data\processed_data\PM\8-K_2024-09-12.md'
Converted 'data\edgar_documents\PM\8-K_2024-09-17' --> 'data\processed_data\PM\8-K_2024-09-17.md'


2025-11-14 17:29:59,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,527 - INFO - Going to convert document batch...
2025-11-14 17:29:59,528 - INFO - Processing document 8-K_2024-10-22
2025-11-14 17:29:59,590 - INFO - Finished converting document 8-K_2024-10-22 in 0.11 sec.
2025-11-14 17:29:59,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,659 - INFO - Going to convert document batch...
2025-11-14 17:29:59,660 - INFO - Processing document 8-K_2024-11-01


Converted 'data\edgar_documents\PM\8-K_2024-10-18' --> 'data\processed_data\PM\8-K_2024-10-18.md'
Converted 'data\edgar_documents\PM\8-K_2024-10-22' --> 'data\processed_data\PM\8-K_2024-10-22.md'


2025-11-14 17:29:59,724 - INFO - Finished converting document 8-K_2024-11-01 in 0.11 sec.
2025-11-14 17:29:59,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,799 - INFO - Going to convert document batch...
2025-11-14 17:29:59,799 - INFO - Processing document 8-K_2024-11-21
2025-11-14 17:29:59,843 - INFO - Finished converting document 8-K_2024-11-21 in 0.09 sec.
2025-11-14 17:29:59,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:29:59,923 - INFO - Going to convert document batch...
2025-11-14 17:29:59,923 - INFO - Processing document 8-K_2024-12-12


Converted 'data\edgar_documents\PM\8-K_2024-11-01' --> 'data\processed_data\PM\8-K_2024-11-01.md'
Converted 'data\edgar_documents\PM\8-K_2024-11-21' --> 'data\processed_data\PM\8-K_2024-11-21.md'


2025-11-14 17:29:59,960 - INFO - Finished converting document 8-K_2024-12-12 in 0.08 sec.
2025-11-14 17:29:59,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,016 - INFO - Going to convert document batch...
2025-11-14 17:30:00,017 - INFO - Processing document 8-K_2024-12-17
2025-11-14 17:30:00,068 - INFO - Finished converting document 8-K_2024-12-17 in 0.09 sec.
2025-11-14 17:30:00,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,128 - INFO - Going to convert document batch...
2025-11-14 17:30:00,129 - INFO - Processing document 8-K_2025-01-02
2025-11-14 17:30:00,162 - INFO - Finished converting document 8-K_2025-01-02 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2024-12-12' --> 'data\processed_data\PM\8-K_2024-12-12.md'
Converted 'data\edgar_documents\PM\8-K_2024-12-17' --> 'data\processed_data\PM\8-K_2024-12-17.md'


2025-11-14 17:30:00,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,212 - INFO - Going to convert document batch...
2025-11-14 17:30:00,213 - INFO - Processing document 8-K_2025-01-16
2025-11-14 17:30:00,255 - INFO - Finished converting document 8-K_2025-01-16 in 0.08 sec.
2025-11-14 17:30:00,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,311 - INFO - Going to convert document batch...
2025-11-14 17:30:00,311 - INFO - Processing document 8-K_2025-02-06
2025-11-14 17:30:00,346 - INFO - Finished converting document 8-K_2025-02-06 in 0.08 sec.


Converted 'data\edgar_documents\PM\8-K_2025-01-02' --> 'data\processed_data\PM\8-K_2025-01-02.md'
Converted 'data\edgar_documents\PM\8-K_2025-01-16' --> 'data\processed_data\PM\8-K_2025-01-16.md'


2025-11-14 17:30:00,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,398 - INFO - Going to convert document batch...
2025-11-14 17:30:00,399 - INFO - Processing document 8-K_2025-02-19
2025-11-14 17:30:00,451 - INFO - Finished converting document 8-K_2025-02-19 in 0.09 sec.
2025-11-14 17:30:00,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,518 - INFO - Going to convert document batch...
2025-11-14 17:30:00,518 - INFO - Processing document 8-K_2025-03-06


Converted 'data\edgar_documents\PM\8-K_2025-02-06' --> 'data\processed_data\PM\8-K_2025-02-06.md'
Converted 'data\edgar_documents\PM\8-K_2025-02-19' --> 'data\processed_data\PM\8-K_2025-02-19.md'


2025-11-14 17:30:00,557 - INFO - Finished converting document 8-K_2025-03-06 in 0.09 sec.
2025-11-14 17:30:00,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,610 - INFO - Going to convert document batch...
2025-11-14 17:30:00,611 - INFO - Processing document 8-K_2025-03-07
2025-11-14 17:30:00,651 - INFO - Finished converting document 8-K_2025-03-07 in 0.08 sec.
2025-11-14 17:30:00,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,703 - INFO - Going to convert document batch...
2025-11-14 17:30:00,703 - INFO - Processing document 8-K_2025-03-25
2025-11-14 17:30:00,740 - INFO - Finished converting document 8-K_2025-03-25 in 0.06 sec.


Converted 'data\edgar_documents\PM\8-K_2025-03-06' --> 'data\processed_data\PM\8-K_2025-03-06.md'
Converted 'data\edgar_documents\PM\8-K_2025-03-07' --> 'data\processed_data\PM\8-K_2025-03-07.md'
Converted 'data\edgar_documents\PM\8-K_2025-03-25' --> 'data\processed_data\PM\8-K_2025-03-25.md'


2025-11-14 17:30:00,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,793 - INFO - Going to convert document batch...
2025-11-14 17:30:00,794 - INFO - Processing document 8-K_2025-04-23
2025-11-14 17:30:00,833 - INFO - Finished converting document 8-K_2025-04-23 in 0.08 sec.
2025-11-14 17:30:00,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:00,891 - INFO - Going to convert document batch...
2025-11-14 17:30:00,892 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:30:00,943 - INFO - Finished converting document 8-K_2025-04-30 in 0.09 sec.
2025-11-14 17:30:01,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,037 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PM\8-K_2025-04-23' --> 'data\processed_data\PM\8-K_2025-04-23.md'
Converted 'data\edgar_documents\PM\8-K_2025-04-30' --> 'data\processed_data\PM\8-K_2025-04-30.md'


2025-11-14 17:30:01,038 - INFO - Processing document 8-K_2025-05-07
2025-11-14 17:30:01,072 - INFO - Finished converting document 8-K_2025-05-07 in 0.09 sec.
2025-11-14 17:30:01,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,132 - INFO - Going to convert document batch...
2025-11-14 17:30:01,134 - INFO - Processing document 8-K_2025-05-09
2025-11-14 17:30:01,199 - INFO - Finished converting document 8-K_2025-05-09 in 0.11 sec.
2025-11-14 17:30:01,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\8-K_2025-05-07' --> 'data\processed_data\PM\8-K_2025-05-07.md'
Converted 'data\edgar_documents\PM\8-K_2025-05-09' --> 'data\processed_data\PM\8-K_2025-05-09.md'


2025-11-14 17:30:01,486 - INFO - Going to convert document batch...
2025-11-14 17:30:01,487 - INFO - Processing document 8-K_2025-06-03
2025-11-14 17:30:01,522 - INFO - Finished converting document 8-K_2025-06-03 in 0.28 sec.
2025-11-14 17:30:01,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,582 - INFO - Going to convert document batch...
2025-11-14 17:30:01,583 - INFO - Processing document 8-K_2025-06-06
2025-11-14 17:30:01,632 - INFO - Finished converting document 8-K_2025-06-06 in 0.09 sec.
2025-11-14 17:30:01,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,694 - INFO - Going to convert document batch...
2025-11-14 17:30:01,695 - INFO - Processing document 8-K_2025-06-13


Converted 'data\edgar_documents\PM\8-K_2025-06-03' --> 'data\processed_data\PM\8-K_2025-06-03.md'
Converted 'data\edgar_documents\PM\8-K_2025-06-06' --> 'data\processed_data\PM\8-K_2025-06-06.md'


2025-11-14 17:30:01,731 - INFO - Finished converting document 8-K_2025-06-13 in 0.08 sec.
2025-11-14 17:30:01,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,788 - INFO - Going to convert document batch...
2025-11-14 17:30:01,789 - INFO - Processing document 8-K_2025-06-24
2025-11-14 17:30:01,826 - INFO - Finished converting document 8-K_2025-06-24 in 0.08 sec.
2025-11-14 17:30:01,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,907 - INFO - Going to convert document batch...
2025-11-14 17:30:01,908 - INFO - Processing document 8-K_2025-07-22
2025-11-14 17:30:01,946 - INFO - Finished converting document 8-K_2025-07-22 in 0.08 sec.


Converted 'data\edgar_documents\PM\8-K_2025-06-13' --> 'data\processed_data\PM\8-K_2025-06-13.md'
Converted 'data\edgar_documents\PM\8-K_2025-06-24' --> 'data\processed_data\PM\8-K_2025-06-24.md'


2025-11-14 17:30:01,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:01,997 - INFO - Going to convert document batch...
2025-11-14 17:30:01,999 - INFO - Processing document 8-K_2025-09-02
2025-11-14 17:30:02,039 - INFO - Finished converting document 8-K_2025-09-02 in 0.06 sec.
2025-11-14 17:30:02,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:02,091 - INFO - Going to convert document batch...
2025-11-14 17:30:02,091 - INFO - Processing document 8-K_2025-09-19
2025-11-14 17:30:02,128 - INFO - Finished converting document 8-K_2025-09-19 in 0.06 sec.
2025-11-14 17:30:02,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PM\8-K_2025-07-22' --> 'data\processed_data\PM\8-K_2025-07-22.md'
Converted 'data\edgar_documents\PM\8-K_2025-09-02' --> 'data\processed_data\PM\8-K_2025-09-02.md'
Converted 'data\edgar_documents\PM\8-K_2025-09-19' --> 'data\processed_data\PM\8-K_2025-09-19.md'


2025-11-14 17:30:02,183 - INFO - Going to convert document batch...
2025-11-14 17:30:02,184 - INFO - Processing document 8-K_2025-10-21
2025-11-14 17:30:02,238 - INFO - Finished converting document 8-K_2025-10-21 in 0.09 sec.
2025-11-14 17:30:02,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:02,318 - INFO - Going to convert document batch...
2025-11-14 17:30:02,318 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:30:02,373 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 17:30:02,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:02,442 - INFO - Going to convert document batch...
2025-11-14 17:30:02,443 - INFO - Processing document 8-K_2025-11-04


Converted 'data\edgar_documents\PM\8-K_2025-10-21' --> 'data\processed_data\PM\8-K_2025-10-21.md'
Converted 'data\edgar_documents\PM\8-K_2025-10-29' --> 'data\processed_data\PM\8-K_2025-10-29.md'


2025-11-14 17:30:02,488 - INFO - Finished converting document 8-K_2025-11-04 in 0.08 sec.
2025-11-14 17:30:02,558 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:30:02,559 - ERROR - Input document DEF-14A_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:30:02,561 - INFO - Going to convert document batch...
2025-11-14 17:30:02,602 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_u

Converted 'data\edgar_documents\PM\8-K_2025-11-04' --> 'data\processed_data\PM\8-K_2025-11-04.md'
Error processing data\edgar_documents\PM\DEF-14A_2023-03-23: File format not allowed: data\edgar_documents\PM\DEF-14A_2023-03-23
Error processing data\edgar_documents\PM\DEF-14A_2024-03-28: File format not allowed: data\edgar_documents\PM\DEF-14A_2024-03-28
Error processing data\edgar_documents\PM\DEF-14A_2025-03-27: File format not allowed: data\edgar_documents\PM\DEF-14A_2025-03-27
Processed 114 new files. Errors: 19
Found 118 files to process in data\edgar_documents\PYPL


2025-11-14 17:30:02,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:03,764 - INFO - Going to convert document batch...
2025-11-14 17:30:03,765 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:30:03,765 - INFO - Processing document 10-K_2023-02-10
2025-11-14 17:30:07,776 - INFO - Finished converting document 10-K_2023-02-10 in 5.12 sec.
2025-11-14 17:30:08,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-K_2023-02-10' --> 'data\processed_data\PYPL\10-K_2023-02-10.md'


2025-11-14 17:30:09,766 - INFO - Going to convert document batch...
2025-11-14 17:30:09,767 - INFO - Processing document 10-K_2024-02-08
2025-11-14 17:30:13,806 - INFO - Finished converting document 10-K_2024-02-08 in 5.20 sec.
2025-11-14 17:30:15,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-K_2024-02-08' --> 'data\processed_data\PYPL\10-K_2024-02-08.md'


2025-11-14 17:30:15,956 - INFO - Going to convert document batch...
2025-11-14 17:30:15,957 - INFO - Processing document 10-K_2025-02-04
2025-11-14 17:30:20,057 - INFO - Finished converting document 10-K_2025-02-04 in 4.92 sec.
2025-11-14 17:30:20,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-K_2025-02-04' --> 'data\processed_data\PYPL\10-K_2025-02-04.md'


2025-11-14 17:30:21,452 - INFO - Going to convert document batch...
2025-11-14 17:30:21,453 - INFO - Processing document 10-Q_2023-05-09
2025-11-14 17:30:22,821 - INFO - Finished converting document 10-Q_2023-05-09 in 1.92 sec.
2025-11-14 17:30:23,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2023-05-09' --> 'data\processed_data\PYPL\10-Q_2023-05-09.md'


2025-11-14 17:30:24,601 - INFO - Going to convert document batch...
2025-11-14 17:30:24,602 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 17:30:26,242 - INFO - Finished converting document 10-Q_2023-08-03 in 2.83 sec.
2025-11-14 17:30:26,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2023-08-03' --> 'data\processed_data\PYPL\10-Q_2023-08-03.md'


2025-11-14 17:30:27,945 - INFO - Going to convert document batch...
2025-11-14 17:30:27,946 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 17:30:29,621 - INFO - Finished converting document 10-Q_2023-11-02 in 2.72 sec.
2025-11-14 17:30:30,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2023-11-02' --> 'data\processed_data\PYPL\10-Q_2023-11-02.md'


2025-11-14 17:30:31,299 - INFO - Going to convert document batch...
2025-11-14 17:30:31,300 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 17:30:32,676 - INFO - Finished converting document 10-Q_2024-04-30 in 2.36 sec.
2025-11-14 17:30:33,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2024-04-30' --> 'data\processed_data\PYPL\10-Q_2024-04-30.md'


2025-11-14 17:30:34,411 - INFO - Going to convert document batch...
2025-11-14 17:30:34,412 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 17:30:36,012 - INFO - Finished converting document 10-Q_2024-07-30 in 2.73 sec.
2025-11-14 17:30:36,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2024-07-30' --> 'data\processed_data\PYPL\10-Q_2024-07-30.md'


2025-11-14 17:30:37,729 - INFO - Going to convert document batch...
2025-11-14 17:30:37,731 - INFO - Processing document 10-Q_2024-10-29
2025-11-14 17:30:39,338 - INFO - Finished converting document 10-Q_2024-10-29 in 2.66 sec.
2025-11-14 17:30:40,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2024-10-29' --> 'data\processed_data\PYPL\10-Q_2024-10-29.md'


2025-11-14 17:30:40,620 - INFO - Going to convert document batch...
2025-11-14 17:30:40,622 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:30:42,422 - INFO - Finished converting document 10-Q_2025-04-29 in 2.38 sec.
2025-11-14 17:30:43,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2025-04-29' --> 'data\processed_data\PYPL\10-Q_2025-04-29.md'


2025-11-14 17:30:43,677 - INFO - Going to convert document batch...
2025-11-14 17:30:43,678 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 17:30:45,334 - INFO - Finished converting document 10-Q_2025-07-29 in 2.31 sec.
2025-11-14 17:30:46,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\10-Q_2025-07-29' --> 'data\processed_data\PYPL\10-Q_2025-07-29.md'


2025-11-14 17:30:47,275 - INFO - Going to convert document batch...
2025-11-14 17:30:47,276 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 17:30:49,242 - INFO - Finished converting document 10-Q_2025-10-28 in 2.70 sec.
2025-11-14 17:30:49,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,001 - INFO - Going to convert document batch...
2025-11-14 17:30:50,002 - INFO - Processing document 4_2023-01-05
2025-11-14 17:30:50,022 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 17:30:50,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,070 - INFO - Going to convert document batch...
2025-11-14 17:30:50,071 - INFO - Processing document 4_2023-02-17
2025-11-14 17:30:50,089 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 17:30:50,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,156 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\PYPL\10-Q_2025-10-28' --> 'data\processed_data\PYPL\10-Q_2025-10-28.md'
Converted 'data\edgar_documents\PYPL\4_2023-01-05' --> 'data\processed_data\PYPL\4_2023-01-05.md'
Converted 'data\edgar_documents\PYPL\4_2023-02-17' --> 'data\processed_data\PYPL\4_2023-02-17.md'


2025-11-14 17:30:50,157 - INFO - Processing document 4_2023-03-03
2025-11-14 17:30:50,217 - INFO - Finished converting document 4_2023-03-03 in 0.11 sec.
2025-11-14 17:30:50,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,271 - INFO - Going to convert document batch...
2025-11-14 17:30:50,271 - INFO - Processing document 4_2023-03-15
2025-11-14 17:30:50,294 - INFO - Finished converting document 4_2023-03-15 in 0.05 sec.
2025-11-14 17:30:50,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,336 - INFO - Going to convert document batch...
2025-11-14 17:30:50,336 - INFO - Processing document 4_2023-04-03
2025-11-14 17:30:50,354 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 17:30:50,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,400 - INFO - Going to convert document batch...
2025-11-14 17:30:50,400 - INFO - Processing document 4_2023-04-18
2025-11-14 17:30:50,420 - IN

Converted 'data\edgar_documents\PYPL\4_2023-03-03' --> 'data\processed_data\PYPL\4_2023-03-03.md'
Converted 'data\edgar_documents\PYPL\4_2023-03-15' --> 'data\processed_data\PYPL\4_2023-03-15.md'
Converted 'data\edgar_documents\PYPL\4_2023-04-03' --> 'data\processed_data\PYPL\4_2023-04-03.md'


2025-11-14 17:30:50,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,463 - INFO - Going to convert document batch...
2025-11-14 17:30:50,464 - INFO - Processing document 4_2023-05-26
2025-11-14 17:30:50,484 - INFO - Finished converting document 4_2023-05-26 in 0.05 sec.
2025-11-14 17:30:50,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,534 - INFO - Going to convert document batch...
2025-11-14 17:30:50,535 - INFO - Processing document 4_2023-06-02
2025-11-14 17:30:50,576 - INFO - Finished converting document 4_2023-06-02 in 0.06 sec.
2025-11-14 17:30:50,633 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\PYPL\4_2023-04-18' --> 'data\processed_data\PYPL\4_2023-04-18.md'
Converted 'data\edgar_documents\PYPL\4_2023-05-26' --> 'data\processed_data\PYPL\4_2023-05-26.md'
Converted 'data\edgar_documents\PYPL\4_2023-06-02' --> 'data\processed_data\PYPL\4_2023-06-02.md'


2025-11-14 17:30:50,634 - ERROR - Input document 4_2023-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:30:50,635 - INFO - Going to convert document batch...
2025-11-14 17:30:50,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,661 - INFO - Going to convert document batch...
2025-11-14 17:30:50,662 - INFO - Processing document 4_2023-06-16
2025-11-14 17:30:50,684 - INFO - Finished converting document 4_2023-06-16 in 0.05 sec.
2025-11-14 17:30:50,731 - INFO - detec

Error processing data\edgar_documents\PYPL\4_2023-06-05: File format not allowed: data\edgar_documents\PYPL\4_2023-06-05
Converted 'data\edgar_documents\PYPL\4_2023-06-16' --> 'data\processed_data\PYPL\4_2023-06-16.md'
Converted 'data\edgar_documents\PYPL\4_2023-09-05' --> 'data\processed_data\PYPL\4_2023-09-05.md'


2025-11-14 17:30:50,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,865 - INFO - Going to convert document batch...
2025-11-14 17:30:50,866 - INFO - Processing document 4_2023-09-18
2025-11-14 17:30:50,890 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 17:30:50,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,933 - INFO - Going to convert document batch...
2025-11-14 17:30:50,934 - INFO - Processing document 4_2023-09-29
2025-11-14 17:30:50,956 - INFO - Finished converting document 4_2023-09-29 in 0.05 sec.
2025-11-14 17:30:50,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:50,997 - INFO - Going to convert document batch...
2025-11-14 17:30:50,997 - INFO - Processing document 4_2023-10-17
2025-11-14 17:30:51,018 - INFO - Finished converting document 4_2023-10-17 in 0.05 sec.
2025-11-14 17:30:51,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\4_2023-09-12' --> 'data\processed_data\PYPL\4_2023-09-12.md'
Converted 'data\edgar_documents\PYPL\4_2023-09-18' --> 'data\processed_data\PYPL\4_2023-09-18.md'
Converted 'data\edgar_documents\PYPL\4_2023-09-29' --> 'data\processed_data\PYPL\4_2023-09-29.md'
Converted 'data\edgar_documents\PYPL\4_2023-10-17' --> 'data\processed_data\PYPL\4_2023-10-17.md'


2025-11-14 17:30:51,082 - INFO - Going to convert document batch...
2025-11-14 17:30:51,084 - INFO - Processing document 4_2023-11-22
2025-11-14 17:30:51,110 - INFO - Finished converting document 4_2023-11-22 in 0.08 sec.
2025-11-14 17:30:51,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,160 - INFO - Going to convert document batch...
2025-11-14 17:30:51,162 - INFO - Processing document 4_2023-11-28
2025-11-14 17:30:51,180 - INFO - Finished converting document 4_2023-11-28 in 0.03 sec.
2025-11-14 17:30:51,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,223 - INFO - Going to convert document batch...
2025-11-14 17:30:51,224 - INFO - Processing document 4_2023-12-04
2025-11-14 17:30:51,246 - INFO - Finished converting document 4_2023-12-04 in 0.05 sec.
2025-11-14 17:30:51,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,286 - INFO - Going to convert document batch...
2025-11-14 17:30:51,287 - 

Converted 'data\edgar_documents\PYPL\4_2023-11-22' --> 'data\processed_data\PYPL\4_2023-11-22.md'
Converted 'data\edgar_documents\PYPL\4_2023-11-28' --> 'data\processed_data\PYPL\4_2023-11-28.md'
Converted 'data\edgar_documents\PYPL\4_2023-12-04' --> 'data\processed_data\PYPL\4_2023-12-04.md'


2025-11-14 17:30:51,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,345 - INFO - Going to convert document batch...
2025-11-14 17:30:51,346 - INFO - Processing document 4_2023-12-15
2025-11-14 17:30:51,368 - INFO - Finished converting document 4_2023-12-15 in 0.03 sec.
2025-11-14 17:30:51,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,413 - INFO - Going to convert document batch...
2025-11-14 17:30:51,414 - INFO - Processing document 4_2024-01-03
2025-11-14 17:30:51,431 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 17:30:51,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,470 - INFO - Going to convert document batch...
2025-11-14 17:30:51,471 - INFO - Processing document 4_2024-01-17
2025-11-14 17:30:51,489 - INFO - Finished converting document 4_2024-01-17 in 0.03 sec.


Converted 'data\edgar_documents\PYPL\4_2023-12-13' --> 'data\processed_data\PYPL\4_2023-12-13.md'
Converted 'data\edgar_documents\PYPL\4_2023-12-15' --> 'data\processed_data\PYPL\4_2023-12-15.md'
Converted 'data\edgar_documents\PYPL\4_2024-01-03' --> 'data\processed_data\PYPL\4_2024-01-03.md'
Converted 'data\edgar_documents\PYPL\4_2024-01-17' --> 'data\processed_data\PYPL\4_2024-01-17.md'


2025-11-14 17:30:51,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,551 - INFO - Going to convert document batch...
2025-11-14 17:30:51,552 - INFO - Processing document 4_2024-02-16
2025-11-14 17:30:51,573 - INFO - Finished converting document 4_2024-02-16 in 0.08 sec.
2025-11-14 17:30:51,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,616 - INFO - Going to convert document batch...
2025-11-14 17:30:51,617 - INFO - Processing document 4_2024-03-04
2025-11-14 17:30:51,634 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.
2025-11-14 17:30:51,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,675 - INFO - Going to convert document batch...
2025-11-14 17:30:51,676 - INFO - Processing document 4_2024-04-16
2025-11-14 17:30:51,698 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 17:30:51,739 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025

Converted 'data\edgar_documents\PYPL\4_2024-02-16' --> 'data\processed_data\PYPL\4_2024-02-16.md'
Converted 'data\edgar_documents\PYPL\4_2024-03-04' --> 'data\processed_data\PYPL\4_2024-03-04.md'
Converted 'data\edgar_documents\PYPL\4_2024-04-16' --> 'data\processed_data\PYPL\4_2024-04-16.md'
Error processing data\edgar_documents\PYPL\4_2024-05-20: File format not allowed: data\edgar_documents\PYPL\4_2024-05-20
Error processing data\edgar_documents\PYPL\4_2024-05-22: File format not allowed: data\edgar_documents\PYPL\4_2024-05-22


2025-11-14 17:30:51,785 - INFO - Going to convert document batch...
2025-11-14 17:30:51,786 - INFO - Processing document 4_2024-05-23
2025-11-14 17:30:51,803 - INFO - Finished converting document 4_2024-05-23 in 0.03 sec.
2025-11-14 17:30:51,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,843 - INFO - Going to convert document batch...
2025-11-14 17:30:51,844 - INFO - Processing document 4_2024-05-24
2025-11-14 17:30:51,860 - INFO - Finished converting document 4_2024-05-24 in 0.05 sec.
2025-11-14 17:30:51,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,907 - INFO - Going to convert document batch...
2025-11-14 17:30:51,908 - INFO - Processing document 4_2024-06-03
2025-11-14 17:30:51,937 - INFO - Finished converting document 4_2024-06-03 in 0.06 sec.
2025-11-14 17:30:51,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:51,981 - INFO - Going to convert document batch...
2025-11-14 17:30:51,982 - 

Converted 'data\edgar_documents\PYPL\4_2024-05-23' --> 'data\processed_data\PYPL\4_2024-05-23.md'
Converted 'data\edgar_documents\PYPL\4_2024-05-24' --> 'data\processed_data\PYPL\4_2024-05-24.md'
Converted 'data\edgar_documents\PYPL\4_2024-06-03' --> 'data\processed_data\PYPL\4_2024-06-03.md'


2025-11-14 17:30:51,999 - INFO - Finished converting document 4_2024-07-03 in 0.03 sec.
2025-11-14 17:30:52,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,043 - INFO - Going to convert document batch...
2025-11-14 17:30:52,044 - INFO - Processing document 4_2024-07-16
2025-11-14 17:30:52,065 - INFO - Finished converting document 4_2024-07-16 in 0.05 sec.
2025-11-14 17:30:52,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,116 - INFO - Going to convert document batch...
2025-11-14 17:30:52,117 - INFO - Processing document 4_2024-09-03
2025-11-14 17:30:52,151 - INFO - Finished converting document 4_2024-09-03 in 0.06 sec.
2025-11-14 17:30:52,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\4_2024-07-03' --> 'data\processed_data\PYPL\4_2024-07-03.md'
Converted 'data\edgar_documents\PYPL\4_2024-07-16' --> 'data\processed_data\PYPL\4_2024-07-16.md'
Converted 'data\edgar_documents\PYPL\4_2024-09-03' --> 'data\processed_data\PYPL\4_2024-09-03.md'


2025-11-14 17:30:52,211 - INFO - Going to convert document batch...
2025-11-14 17:30:52,212 - INFO - Processing document 4_2024-10-15
2025-11-14 17:30:52,236 - INFO - Finished converting document 4_2024-10-15 in 0.06 sec.
2025-11-14 17:30:52,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,289 - INFO - Going to convert document batch...
2025-11-14 17:30:52,290 - INFO - Processing document 4_2024-12-02
2025-11-14 17:30:52,322 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 17:30:52,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,371 - INFO - Going to convert document batch...
2025-11-14 17:30:52,372 - INFO - Processing document 4_2024-12-16
2025-11-14 17:30:52,396 - INFO - Finished converting document 4_2024-12-16 in 0.05 sec.
2025-11-14 17:30:52,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,436 - INFO - Going to convert document batch...
2025-11-14 17:30:52,437 - 

Converted 'data\edgar_documents\PYPL\4_2024-10-15' --> 'data\processed_data\PYPL\4_2024-10-15.md'
Converted 'data\edgar_documents\PYPL\4_2024-12-02' --> 'data\processed_data\PYPL\4_2024-12-02.md'
Converted 'data\edgar_documents\PYPL\4_2024-12-16' --> 'data\processed_data\PYPL\4_2024-12-16.md'


2025-11-14 17:30:52,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,499 - INFO - Going to convert document batch...
2025-11-14 17:30:52,500 - INFO - Processing document 4_2025-01-17
2025-11-14 17:30:52,520 - INFO - Finished converting document 4_2025-01-17 in 0.05 sec.
2025-11-14 17:30:52,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,569 - INFO - Going to convert document batch...
2025-11-14 17:30:52,570 - INFO - Processing document 4_2025-02-18
2025-11-14 17:30:52,598 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 17:30:52,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,640 - INFO - Going to convert document batch...
2025-11-14 17:30:52,640 - INFO - Processing document 4_2025-02-28
2025-11-14 17:30:52,657 - INFO - Finished converting document 4_2025-02-28 in 0.03 sec.


Converted 'data\edgar_documents\PYPL\4_2025-01-03' --> 'data\processed_data\PYPL\4_2025-01-03.md'
Converted 'data\edgar_documents\PYPL\4_2025-01-17' --> 'data\processed_data\PYPL\4_2025-01-17.md'
Converted 'data\edgar_documents\PYPL\4_2025-02-18' --> 'data\processed_data\PYPL\4_2025-02-18.md'


2025-11-14 17:30:52,694 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:30:52,695 - ERROR - Input document 4_2025-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:30:52,696 - INFO - Going to convert document batch...
2025-11-14 17:30:52,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,718 - INFO - Going to convert document batch...
2025-11-14 17:30:52,719 - INFO - Processing document 4_2025-03-04
2025-11-14 17:30:52,739 - INFO - Fin

Converted 'data\edgar_documents\PYPL\4_2025-02-28' --> 'data\processed_data\PYPL\4_2025-02-28.md'
Error processing data\edgar_documents\PYPL\4_2025-03-03: File format not allowed: data\edgar_documents\PYPL\4_2025-03-03
Converted 'data\edgar_documents\PYPL\4_2025-03-04' --> 'data\processed_data\PYPL\4_2025-03-04.md'
Error processing data\edgar_documents\PYPL\4_2025-03-05: File format not allowed: data\edgar_documents\PYPL\4_2025-03-05
Converted 'data\edgar_documents\PYPL\4_2025-03-11' --> 'data\processed_data\PYPL\4_2025-03-11.md'


2025-11-14 17:30:52,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:52,908 - INFO - Going to convert document batch...
2025-11-14 17:30:52,909 - INFO - Processing document 4_2025-03-18
2025-11-14 17:30:52,932 - INFO - Finished converting document 4_2025-03-18 in 0.06 sec.
2025-11-14 17:30:52,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,000 - INFO - Going to convert document batch...
2025-11-14 17:30:53,002 - INFO - Processing document 4_2025-04-16
2025-11-14 17:30:53,036 - INFO - Finished converting document 4_2025-04-16 in 0.08 sec.
2025-11-14 17:30:53,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,083 - INFO - Going to convert document batch...
2025-11-14 17:30:53,084 - INFO - Processing document 4_2025-05-15
2025-11-14 17:30:53,105 - INFO - Finished converting document 4_2025-05-15 in 0.05 sec.
2025-11-14 17:30:53,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\4_2025-03-18' --> 'data\processed_data\PYPL\4_2025-03-18.md'
Converted 'data\edgar_documents\PYPL\4_2025-04-16' --> 'data\processed_data\PYPL\4_2025-04-16.md'
Converted 'data\edgar_documents\PYPL\4_2025-05-15' --> 'data\processed_data\PYPL\4_2025-05-15.md'


2025-11-14 17:30:53,164 - INFO - Going to convert document batch...
2025-11-14 17:30:53,165 - INFO - Processing document 4_2025-06-03
2025-11-14 17:30:53,195 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 17:30:53,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,242 - INFO - Going to convert document batch...
2025-11-14 17:30:53,243 - INFO - Processing document 4_2025-06-06
2025-11-14 17:30:53,262 - INFO - Finished converting document 4_2025-06-06 in 0.05 sec.
2025-11-14 17:30:53,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,307 - INFO - Going to convert document batch...
2025-11-14 17:30:53,309 - INFO - Processing document 4_2025-06-09
2025-11-14 17:30:53,352 - INFO - Finished converting document 4_2025-06-09 in 0.06 sec.
2025-11-14 17:30:53,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,395 - INFO - Going to convert document batch...
2025-11-14 17:30:53,395 - 

Converted 'data\edgar_documents\PYPL\4_2025-06-03' --> 'data\processed_data\PYPL\4_2025-06-03.md'
Converted 'data\edgar_documents\PYPL\4_2025-06-06' --> 'data\processed_data\PYPL\4_2025-06-06.md'
Converted 'data\edgar_documents\PYPL\4_2025-06-09' --> 'data\processed_data\PYPL\4_2025-06-09.md'


2025-11-14 17:30:53,422 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 17:30:53,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,466 - INFO - Going to convert document batch...
2025-11-14 17:30:53,466 - INFO - Processing document 4_2025-06-24
2025-11-14 17:30:53,490 - INFO - Finished converting document 4_2025-06-24 in 0.05 sec.
2025-11-14 17:30:53,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,550 - INFO - Going to convert document batch...
2025-11-14 17:30:53,551 - INFO - Processing document 4_2025-06-25
2025-11-14 17:30:53,570 - INFO - Finished converting document 4_2025-06-25 in 0.05 sec.
2025-11-14 17:30:53,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,613 - INFO - Going to convert document batch...
2025-11-14 17:30:53,614 - INFO - Processing document 4_2025-07-16
2025-11-14 17:30:53,638 - INFO - Finished converting document 4_2025-07-16 in 0.05 sec.


Converted 'data\edgar_documents\PYPL\4_2025-06-17' --> 'data\processed_data\PYPL\4_2025-06-17.md'
Converted 'data\edgar_documents\PYPL\4_2025-06-24' --> 'data\processed_data\PYPL\4_2025-06-24.md'
Converted 'data\edgar_documents\PYPL\4_2025-06-25' --> 'data\processed_data\PYPL\4_2025-06-25.md'


2025-11-14 17:30:53,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,683 - INFO - Going to convert document batch...
2025-11-14 17:30:53,684 - INFO - Processing document 4_2025-08-01
2025-11-14 17:30:53,704 - INFO - Finished converting document 4_2025-08-01 in 0.05 sec.
2025-11-14 17:30:53,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,745 - INFO - Going to convert document batch...
2025-11-14 17:30:53,746 - INFO - Processing document 4_2025-08-18
2025-11-14 17:30:53,770 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 17:30:53,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,814 - INFO - Going to convert document batch...
2025-11-14 17:30:53,814 - INFO - Processing document 4_2025-08-20
2025-11-14 17:30:53,832 - INFO - Finished converting document 4_2025-08-20 in 0.03 sec.


Converted 'data\edgar_documents\PYPL\4_2025-07-16' --> 'data\processed_data\PYPL\4_2025-07-16.md'
Converted 'data\edgar_documents\PYPL\4_2025-08-01' --> 'data\processed_data\PYPL\4_2025-08-01.md'
Converted 'data\edgar_documents\PYPL\4_2025-08-18' --> 'data\processed_data\PYPL\4_2025-08-18.md'


2025-11-14 17:30:53,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,878 - INFO - Going to convert document batch...
2025-11-14 17:30:53,879 - INFO - Processing document 4_2025-09-02
2025-11-14 17:30:53,908 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 17:30:53,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:53,971 - INFO - Going to convert document batch...
2025-11-14 17:30:53,971 - INFO - Processing document 4_2025-09-15
2025-11-14 17:30:53,997 - INFO - Finished converting document 4_2025-09-15 in 0.06 sec.
2025-11-14 17:30:54,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\4_2025-08-20' --> 'data\processed_data\PYPL\4_2025-08-20.md'
Converted 'data\edgar_documents\PYPL\4_2025-09-02' --> 'data\processed_data\PYPL\4_2025-09-02.md'
Converted 'data\edgar_documents\PYPL\4_2025-09-15' --> 'data\processed_data\PYPL\4_2025-09-15.md'


2025-11-14 17:30:54,041 - INFO - Going to convert document batch...
2025-11-14 17:30:54,042 - INFO - Processing document 4_2025-10-16
2025-11-14 17:30:54,084 - INFO - Finished converting document 4_2025-10-16 in 0.06 sec.
2025-11-14 17:30:54,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,128 - INFO - Going to convert document batch...
2025-11-14 17:30:54,129 - INFO - Processing document 4_2025-10-31
2025-11-14 17:30:54,149 - INFO - Finished converting document 4_2025-10-31 in 0.03 sec.
2025-11-14 17:30:54,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,191 - INFO - Going to convert document batch...
2025-11-14 17:30:54,192 - INFO - Processing document 4_2025-11-04
2025-11-14 17:30:54,209 - INFO - Finished converting document 4_2025-11-04 in 0.03 sec.
2025-11-14 17:30:54,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,252 - INFO - Going to convert document batch...
2025-11-14 17:30:54,252 - 

Converted 'data\edgar_documents\PYPL\4_2025-10-16' --> 'data\processed_data\PYPL\4_2025-10-16.md'
Converted 'data\edgar_documents\PYPL\4_2025-10-31' --> 'data\processed_data\PYPL\4_2025-10-31.md'
Converted 'data\edgar_documents\PYPL\4_2025-11-04' --> 'data\processed_data\PYPL\4_2025-11-04.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-01-09' --> 'data\processed_data\PYPL\8-K_2023-01-09.md'


2025-11-14 17:30:54,301 - INFO - Processing document 8-K_2023-02-09
2025-11-14 17:30:54,317 - INFO - Finished converting document 8-K_2023-02-09 in 0.05 sec.
2025-11-14 17:30:54,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,352 - INFO - Going to convert document batch...
2025-11-14 17:30:54,353 - INFO - Processing document 8-K_2023-02-16
2025-11-14 17:30:54,365 - INFO - Finished converting document 8-K_2023-02-16 in 0.03 sec.
2025-11-14 17:30:54,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,395 - INFO - Going to convert document batch...
2025-11-14 17:30:54,396 - INFO - Processing document 8-K_2023-03-07
2025-11-14 17:30:54,410 - INFO - Finished converting document 8-K_2023-03-07 in 0.03 sec.
2025-11-14 17:30:54,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,441 - INFO - Going to convert document batch...
2025-11-14 17:30:54,442 - INFO - Processing document 8-K_2023-05-08
2025-11-14 17:

Converted 'data\edgar_documents\PYPL\8-K_2023-02-09' --> 'data\processed_data\PYPL\8-K_2023-02-09.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-02-16' --> 'data\processed_data\PYPL\8-K_2023-02-16.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-03-07' --> 'data\processed_data\PYPL\8-K_2023-03-07.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-05-08' --> 'data\processed_data\PYPL\8-K_2023-05-08.md'


2025-11-14 17:30:54,540 - INFO - Finished converting document 8-K_2023-05-31 in 0.08 sec.
2025-11-14 17:30:54,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,581 - INFO - Going to convert document batch...
2025-11-14 17:30:54,582 - INFO - Processing document 8-K_2023-06-02
2025-11-14 17:30:54,601 - INFO - Finished converting document 8-K_2023-06-02 in 0.03 sec.
2025-11-14 17:30:54,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,646 - INFO - Going to convert document batch...
2025-11-14 17:30:54,648 - INFO - Processing document 8-K_2023-06-09
2025-11-14 17:30:54,679 - INFO - Finished converting document 8-K_2023-06-09 in 0.06 sec.
2025-11-14 17:30:54,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,716 - INFO - Going to convert document batch...
2025-11-14 17:30:54,717 - INFO - Processing document 8-K_2023-06-13
2025-11-14 17:30:54,737 - INFO - Finished converting document 8-K_2023-06-13 in 0.

Converted 'data\edgar_documents\PYPL\8-K_2023-05-31' --> 'data\processed_data\PYPL\8-K_2023-05-31.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-06-02' --> 'data\processed_data\PYPL\8-K_2023-06-02.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-06-09' --> 'data\processed_data\PYPL\8-K_2023-06-09.md'


2025-11-14 17:30:54,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,770 - INFO - Going to convert document batch...
2025-11-14 17:30:54,771 - INFO - Processing document 8-K_2023-06-22
2025-11-14 17:30:54,794 - INFO - Finished converting document 8-K_2023-06-22 in 0.05 sec.
2025-11-14 17:30:54,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,832 - INFO - Going to convert document batch...
2025-11-14 17:30:54,833 - INFO - Processing document 8-K_2023-08-02
2025-11-14 17:30:54,847 - INFO - Finished converting document 8-K_2023-08-02 in 0.03 sec.
2025-11-14 17:30:54,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:54,887 - INFO - Going to convert document batch...
2025-11-14 17:30:54,888 - INFO - Processing document 8-K_2023-08-08
2025-11-14 17:30:54,914 - INFO - Finished converting document 8-K_2023-08-08 in 0.05 sec.
2025-11-14 17:30:54,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\PYPL\8-K_2023-06-13' --> 'data\processed_data\PYPL\8-K_2023-06-13.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-06-22' --> 'data\processed_data\PYPL\8-K_2023-06-22.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-08-02' --> 'data\processed_data\PYPL\8-K_2023-08-02.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-08-08' --> 'data\processed_data\PYPL\8-K_2023-08-08.md'


2025-11-14 17:30:54,950 - INFO - Going to convert document batch...
2025-11-14 17:30:54,951 - INFO - Processing document 8-K_2023-08-14
2025-11-14 17:30:54,978 - INFO - Finished converting document 8-K_2023-08-14 in 0.05 sec.
2025-11-14 17:30:55,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,019 - INFO - Going to convert document batch...
2025-11-14 17:30:55,020 - INFO - Processing document 8-K_2023-10-02
2025-11-14 17:30:55,035 - INFO - Finished converting document 8-K_2023-10-02 in 0.05 sec.
2025-11-14 17:30:55,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,067 - INFO - Going to convert document batch...
2025-11-14 17:30:55,068 - INFO - Processing document 8-K_2023-11-01
2025-11-14 17:30:55,087 - INFO - Finished converting document 8-K_2023-11-01 in 0.03 sec.
2025-11-14 17:30:55,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,120 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PYPL\8-K_2023-08-14' --> 'data\processed_data\PYPL\8-K_2023-08-14.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-10-02' --> 'data\processed_data\PYPL\8-K_2023-10-02.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-11-01' --> 'data\processed_data\PYPL\8-K_2023-11-01.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-12-06' --> 'data\processed_data\PYPL\8-K_2023-12-06.md'


2025-11-14 17:30:55,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,202 - INFO - Going to convert document batch...
2025-11-14 17:30:55,204 - INFO - Processing document 8-K_2023-12-22
2025-11-14 17:30:55,221 - INFO - Finished converting document 8-K_2023-12-22 in 0.05 sec.
2025-11-14 17:30:55,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,262 - INFO - Going to convert document batch...
2025-11-14 17:30:55,262 - INFO - Processing document 8-K_2024-01-08
2025-11-14 17:30:55,277 - INFO - Finished converting document 8-K_2024-01-08 in 0.05 sec.
2025-11-14 17:30:55,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,308 - INFO - Going to convert document batch...
2025-11-14 17:30:55,308 - INFO - Processing document 8-K_2024-02-07
2025-11-14 17:30:55,324 - INFO - Finished converting document 8-K_2024-02-07 in 0.05 sec.
2025-11-14 17:30:55,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\PYPL\8-K_2023-12-14' --> 'data\processed_data\PYPL\8-K_2023-12-14.md'
Converted 'data\edgar_documents\PYPL\8-K_2023-12-22' --> 'data\processed_data\PYPL\8-K_2023-12-22.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-01-08' --> 'data\processed_data\PYPL\8-K_2024-01-08.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-02-07' --> 'data\processed_data\PYPL\8-K_2024-02-07.md'


2025-11-14 17:30:55,357 - INFO - Processing document 8-K_2024-02-12
2025-11-14 17:30:55,373 - INFO - Finished converting document 8-K_2024-02-12 in 0.05 sec.
2025-11-14 17:30:55,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,410 - INFO - Going to convert document batch...
2025-11-14 17:30:55,411 - INFO - Processing document 8-K_2024-03-28
2025-11-14 17:30:55,428 - INFO - Finished converting document 8-K_2024-03-28 in 0.05 sec.
2025-11-14 17:30:55,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,482 - INFO - Going to convert document batch...
2025-11-14 17:30:55,483 - INFO - Processing document 8-K_2024-04-30
2025-11-14 17:30:55,535 - INFO - Finished converting document 8-K_2024-04-30 in 0.09 sec.


Converted 'data\edgar_documents\PYPL\8-K_2024-02-12' --> 'data\processed_data\PYPL\8-K_2024-02-12.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-03-28' --> 'data\processed_data\PYPL\8-K_2024-03-28.md'


2025-11-14 17:30:55,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,580 - INFO - Going to convert document batch...
2025-11-14 17:30:55,582 - INFO - Processing document 8-K_2024-05-21
2025-11-14 17:30:55,598 - INFO - Finished converting document 8-K_2024-05-21 in 0.03 sec.
2025-11-14 17:30:55,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:55,667 - INFO - Going to convert document batch...
2025-11-14 17:30:55,669 - INFO - Processing document 8-K_2024-05-28


Converted 'data\edgar_documents\PYPL\8-K_2024-04-30' --> 'data\processed_data\PYPL\8-K_2024-04-30.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-05-21' --> 'data\processed_data\PYPL\8-K_2024-05-21.md'


2025-11-14 17:30:56,248 - INFO - Finished converting document 8-K_2024-05-28 in 0.62 sec.
2025-11-14 17:30:56,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,286 - INFO - Going to convert document batch...
2025-11-14 17:30:56,287 - INFO - Processing document 8-K_2024-06-03
2025-11-14 17:30:56,307 - INFO - Finished converting document 8-K_2024-06-03 in 0.05 sec.
2025-11-14 17:30:56,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,335 - INFO - Going to convert document batch...
2025-11-14 17:30:56,335 - INFO - Processing document 8-K_2024-06-28
2025-11-14 17:30:56,347 - INFO - Finished converting document 8-K_2024-06-28 in 0.03 sec.
2025-11-14 17:30:56,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,375 - INFO - Going to convert document batch...
2025-11-14 17:30:56,376 - INFO - Processing document 8-K_2024-07-25
2025-11-14 17:30:56,393 - INFO - Finished converting document 8-K_2024-07-25 in 0.

Converted 'data\edgar_documents\PYPL\8-K_2024-05-28' --> 'data\processed_data\PYPL\8-K_2024-05-28.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-06-03' --> 'data\processed_data\PYPL\8-K_2024-06-03.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-06-28' --> 'data\processed_data\PYPL\8-K_2024-06-28.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-07-25' --> 'data\processed_data\PYPL\8-K_2024-07-25.md'
Converted 'data\edgar_documents\PYPL\8-K_2024-07-30' --> 'data\processed_data\PYPL\8-K_2024-07-30.md'


2025-11-14 17:30:56,464 - INFO - Going to convert document batch...
2025-11-14 17:30:56,464 - INFO - Processing document 8-K_2024-10-29
2025-11-14 17:30:56,479 - INFO - Finished converting document 8-K_2024-10-29 in 0.05 sec.
2025-11-14 17:30:56,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,512 - INFO - Going to convert document batch...
2025-11-14 17:30:56,512 - INFO - Processing document 8-K_2025-01-22
2025-11-14 17:30:56,533 - INFO - Finished converting document 8-K_2025-01-22 in 0.05 sec.
2025-11-14 17:30:56,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,576 - INFO - Going to convert document batch...
2025-11-14 17:30:56,578 - INFO - Processing document 8-K_2025-02-04
2025-11-14 17:30:56,595 - INFO - Finished converting document 8-K_2025-02-04 in 0.05 sec.
2025-11-14 17:30:56,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,625 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PYPL\8-K_2024-10-29' --> 'data\processed_data\PYPL\8-K_2024-10-29.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-01-22' --> 'data\processed_data\PYPL\8-K_2025-01-22.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-02-04' --> 'data\processed_data\PYPL\8-K_2025-02-04.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-02-25' --> 'data\processed_data\PYPL\8-K_2025-02-25.md'


2025-11-14 17:30:56,676 - INFO - Processing document 8-K_2025-03-06
2025-11-14 17:30:56,697 - INFO - Finished converting document 8-K_2025-03-06 in 0.03 sec.
2025-11-14 17:30:56,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,736 - INFO - Going to convert document batch...
2025-11-14 17:30:56,737 - INFO - Processing document 8-K_2025-03-10
2025-11-14 17:30:56,753 - INFO - Finished converting document 8-K_2025-03-10 in 0.05 sec.
2025-11-14 17:30:56,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,806 - INFO - Going to convert document batch...
2025-11-14 17:30:56,807 - INFO - Processing document 8-K_2025-04-07
2025-11-14 17:30:56,821 - INFO - Finished converting document 8-K_2025-04-07 in 0.05 sec.
2025-11-14 17:30:56,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:56,850 - INFO - Going to convert document batch...
2025-11-14 17:30:56,851 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:

Converted 'data\edgar_documents\PYPL\8-K_2025-03-06' --> 'data\processed_data\PYPL\8-K_2025-03-06.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-03-10' --> 'data\processed_data\PYPL\8-K_2025-03-10.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-04-07' --> 'data\processed_data\PYPL\8-K_2025-04-07.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-04-29' --> 'data\processed_data\PYPL\8-K_2025-04-29.md'


2025-11-14 17:30:56,904 - INFO - Going to convert document batch...
2025-11-14 17:30:56,905 - INFO - Processing document 8-K_2025-06-09
2025-11-14 17:30:56,954 - INFO - Finished converting document 8-K_2025-06-09 in 0.08 sec.
2025-11-14 17:30:57,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:57,014 - INFO - Going to convert document batch...
2025-11-14 17:30:57,015 - INFO - Processing document 8-K_2025-06-24
2025-11-14 17:30:57,033 - INFO - Finished converting document 8-K_2025-06-24 in 0.05 sec.
2025-11-14 17:30:57,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:57,079 - INFO - Going to convert document batch...
2025-11-14 17:30:57,080 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:30:57,094 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 17:30:57,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:30:57,120 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\PYPL\8-K_2025-06-09' --> 'data\processed_data\PYPL\8-K_2025-06-09.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-06-24' --> 'data\processed_data\PYPL\8-K_2025-06-24.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-07-29' --> 'data\processed_data\PYPL\8-K_2025-07-29.md'
Converted 'data\edgar_documents\PYPL\8-K_2025-10-28' --> 'data\processed_data\PYPL\8-K_2025-10-28.md'


2025-11-14 17:30:57,182 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:30:57,183 - ERROR - Input document DEF-14A_2023-04-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:30:57,186 - INFO - Going to convert document batch...
2025-11-14 17:30:57,239 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:30:57,240 - ERROR - Input document DEF-14A_2024-04-09 with format No

Error processing data\edgar_documents\PYPL\DEF-14A_2023-04-13: File format not allowed: data\edgar_documents\PYPL\DEF-14A_2023-04-13
Error processing data\edgar_documents\PYPL\DEF-14A_2024-04-09: File format not allowed: data\edgar_documents\PYPL\DEF-14A_2024-04-09
Error processing data\edgar_documents\PYPL\DEF-14A_2025-04-21: File format not allowed: data\edgar_documents\PYPL\DEF-14A_2025-04-21
Processed 110 new files. Errors: 8
Found 143 files to process in data\edgar_documents\QCOM
Error processing data\edgar_documents\QCOM\10-K_2023-11-01: File format not allowed: data\edgar_documents\QCOM\10-K_2023-11-01


2025-11-14 17:30:57,741 - INFO - Going to convert document batch...
2025-11-14 17:30:57,741 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:30:57,743 - INFO - Processing document 10-K_2024-11-06
2025-11-14 17:30:58,674 - INFO - Finished converting document 10-K_2024-11-06 in 1.34 sec.
2025-11-14 17:30:59,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-K_2024-11-06' --> 'data\processed_data\QCOM\10-K_2024-11-06.md'


2025-11-14 17:30:59,676 - INFO - Going to convert document batch...
2025-11-14 17:30:59,677 - INFO - Processing document 10-K_2025-11-05
2025-11-14 17:31:00,485 - INFO - Finished converting document 10-K_2025-11-05 in 1.44 sec.
2025-11-14 17:31:00,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-K_2025-11-05' --> 'data\processed_data\QCOM\10-K_2025-11-05.md'


2025-11-14 17:31:01,161 - INFO - Going to convert document batch...
2025-11-14 17:31:01,162 - INFO - Processing document 10-Q_2023-02-02
2025-11-14 17:31:01,742 - INFO - Finished converting document 10-Q_2023-02-02 in 0.86 sec.
2025-11-14 17:31:02,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2023-02-02' --> 'data\processed_data\QCOM\10-Q_2023-02-02.md'


2025-11-14 17:31:02,663 - INFO - Going to convert document batch...
2025-11-14 17:31:02,663 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 17:31:03,240 - INFO - Finished converting document 10-Q_2023-05-03 in 1.19 sec.
2025-11-14 17:31:03,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2023-05-03' --> 'data\processed_data\QCOM\10-Q_2023-05-03.md'


2025-11-14 17:31:03,856 - INFO - Going to convert document batch...
2025-11-14 17:31:03,857 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 17:31:04,443 - INFO - Finished converting document 10-Q_2023-08-02 in 0.88 sec.
2025-11-14 17:31:04,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2023-08-02' --> 'data\processed_data\QCOM\10-Q_2023-08-02.md'


2025-11-14 17:31:05,265 - INFO - Going to convert document batch...
2025-11-14 17:31:05,266 - INFO - Processing document 10-Q_2024-01-31
2025-11-14 17:31:05,750 - INFO - Finished converting document 10-Q_2024-01-31 in 1.00 sec.
2025-11-14 17:31:06,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2024-01-31' --> 'data\processed_data\QCOM\10-Q_2024-01-31.md'


2025-11-14 17:31:06,294 - INFO - Going to convert document batch...
2025-11-14 17:31:06,297 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 17:31:06,826 - INFO - Finished converting document 10-Q_2024-05-01 in 0.81 sec.
2025-11-14 17:31:07,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2024-05-01' --> 'data\processed_data\QCOM\10-Q_2024-05-01.md'


2025-11-14 17:31:07,671 - INFO - Going to convert document batch...
2025-11-14 17:31:07,672 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 17:31:08,221 - INFO - Finished converting document 10-Q_2024-07-31 in 1.09 sec.
2025-11-14 17:31:08,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2024-07-31' --> 'data\processed_data\QCOM\10-Q_2024-07-31.md'


2025-11-14 17:31:08,749 - INFO - Going to convert document batch...
2025-11-14 17:31:08,750 - INFO - Processing document 10-Q_2025-02-05
2025-11-14 17:31:09,220 - INFO - Finished converting document 10-Q_2025-02-05 in 0.70 sec.
2025-11-14 17:31:09,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2025-02-05' --> 'data\processed_data\QCOM\10-Q_2025-02-05.md'


2025-11-14 17:31:09,751 - INFO - Going to convert document batch...
2025-11-14 17:31:09,752 - INFO - Processing document 10-Q_2025-04-30
2025-11-14 17:31:10,303 - INFO - Finished converting document 10-Q_2025-04-30 in 0.81 sec.
2025-11-14 17:31:10,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\10-Q_2025-04-30' --> 'data\processed_data\QCOM\10-Q_2025-04-30.md'


2025-11-14 17:31:11,181 - INFO - Going to convert document batch...
2025-11-14 17:31:11,182 - INFO - Processing document 10-Q_2025-07-30
2025-11-14 17:31:11,723 - INFO - Finished converting document 10-Q_2025-07-30 in 0.81 sec.
2025-11-14 17:31:12,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,044 - INFO - Going to convert document batch...
2025-11-14 17:31:12,044 - INFO - Processing document 4_2023-01-04
2025-11-14 17:31:12,061 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 17:31:12,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,123 - INFO - Going to convert document batch...
2025-11-14 17:31:12,124 - INFO - Processing document 4_2023-02-07
2025-11-14 17:31:12,146 - INFO - Finished converting document 4_2023-02-07 in 0.06 sec.
2025-11-14 17:31:12,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,191 - INFO - Going to convert document batch...
2025-11-14 17:31:12,

Converted 'data\edgar_documents\QCOM\10-Q_2025-07-30' --> 'data\processed_data\QCOM\10-Q_2025-07-30.md'
Converted 'data\edgar_documents\QCOM\4_2023-01-04' --> 'data\processed_data\QCOM\4_2023-01-04.md'
Converted 'data\edgar_documents\QCOM\4_2023-02-07' --> 'data\processed_data\QCOM\4_2023-02-07.md'


2025-11-14 17:31:12,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,252 - INFO - Going to convert document batch...
2025-11-14 17:31:12,253 - INFO - Processing document 4_2023-02-24
2025-11-14 17:31:12,272 - INFO - Finished converting document 4_2023-02-24 in 0.03 sec.
2025-11-14 17:31:12,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,324 - INFO - Going to convert document batch...
2025-11-14 17:31:12,325 - INFO - Processing document 4_2023-03-10
2025-11-14 17:31:12,358 - INFO - Finished converting document 4_2023-03-10 in 0.06 sec.
2025-11-14 17:31:12,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,407 - INFO - Going to convert document batch...
2025-11-14 17:31:12,407 - INFO - Processing document 4_2023-03-13


Converted 'data\edgar_documents\QCOM\4_2023-02-17' --> 'data\processed_data\QCOM\4_2023-02-17.md'
Converted 'data\edgar_documents\QCOM\4_2023-02-24' --> 'data\processed_data\QCOM\4_2023-02-24.md'
Converted 'data\edgar_documents\QCOM\4_2023-03-10' --> 'data\processed_data\QCOM\4_2023-03-10.md'


2025-11-14 17:31:12,431 - INFO - Finished converting document 4_2023-03-13 in 0.05 sec.
2025-11-14 17:31:12,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,472 - INFO - Going to convert document batch...
2025-11-14 17:31:12,473 - INFO - Processing document 4_2023-04-03
2025-11-14 17:31:12,493 - INFO - Finished converting document 4_2023-04-03 in 0.03 sec.
2025-11-14 17:31:12,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,561 - INFO - Going to convert document batch...
2025-11-14 17:31:12,562 - INFO - Processing document 4_2023-04-14
2025-11-14 17:31:12,583 - INFO - Finished converting document 4_2023-04-14 in 0.06 sec.
2025-11-14 17:31:12,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,633 - INFO - Going to convert document batch...
2025-11-14 17:31:12,634 - INFO - Processing document 4_2023-05-22
2025-11-14 17:31:12,665 - INFO - Finished converting document 4_2023-05-22 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2023-03-13' --> 'data\processed_data\QCOM\4_2023-03-13.md'
Converted 'data\edgar_documents\QCOM\4_2023-04-03' --> 'data\processed_data\QCOM\4_2023-04-03.md'
Converted 'data\edgar_documents\QCOM\4_2023-04-14' --> 'data\processed_data\QCOM\4_2023-04-14.md'


2025-11-14 17:31:12,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,728 - INFO - Going to convert document batch...
2025-11-14 17:31:12,730 - INFO - Processing document 4_2023-07-03
2025-11-14 17:31:12,766 - INFO - Finished converting document 4_2023-07-03 in 0.06 sec.
2025-11-14 17:31:12,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,814 - INFO - Going to convert document batch...
2025-11-14 17:31:12,815 - INFO - Processing document 4_2023-08-11
2025-11-14 17:31:12,835 - INFO - Finished converting document 4_2023-08-11 in 0.03 sec.
2025-11-14 17:31:12,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,891 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\QCOM\4_2023-05-22' --> 'data\processed_data\QCOM\4_2023-05-22.md'
Converted 'data\edgar_documents\QCOM\4_2023-07-03' --> 'data\processed_data\QCOM\4_2023-07-03.md'
Converted 'data\edgar_documents\QCOM\4_2023-08-11' --> 'data\processed_data\QCOM\4_2023-08-11.md'


2025-11-14 17:31:12,891 - INFO - Processing document 4_2023-08-18
2025-11-14 17:31:12,908 - INFO - Finished converting document 4_2023-08-18 in 0.05 sec.
2025-11-14 17:31:12,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:12,949 - INFO - Going to convert document batch...
2025-11-14 17:31:12,950 - INFO - Processing document 4_2023-09-11
2025-11-14 17:31:12,969 - INFO - Finished converting document 4_2023-09-11 in 0.05 sec.
2025-11-14 17:31:12,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,007 - INFO - Going to convert document batch...
2025-11-14 17:31:13,008 - INFO - Processing document 4_2023-09-13
2025-11-14 17:31:13,028 - INFO - Finished converting document 4_2023-09-13 in 0.05 sec.
2025-11-14 17:31:13,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,086 - INFO - Going to convert document batch...
2025-11-14 17:31:13,087 - INFO - Processing document 4_2023-10-02
2025-11-14 17:31:13,111 - IN

Converted 'data\edgar_documents\QCOM\4_2023-08-18' --> 'data\processed_data\QCOM\4_2023-08-18.md'
Converted 'data\edgar_documents\QCOM\4_2023-09-11' --> 'data\processed_data\QCOM\4_2023-09-11.md'
Converted 'data\edgar_documents\QCOM\4_2023-09-13' --> 'data\processed_data\QCOM\4_2023-09-13.md'


2025-11-14 17:31:13,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,155 - INFO - Going to convert document batch...
2025-11-14 17:31:13,156 - INFO - Processing document 4_2023-10-11
2025-11-14 17:31:13,173 - INFO - Finished converting document 4_2023-10-11 in 0.03 sec.
2025-11-14 17:31:13,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,219 - INFO - Going to convert document batch...
2025-11-14 17:31:13,220 - INFO - Processing document 4_2023-11-02
2025-11-14 17:31:13,242 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:31:13,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,284 - INFO - Going to convert document batch...
2025-11-14 17:31:13,285 - INFO - Processing document 4_2023-11-09
2025-11-14 17:31:13,304 - INFO - Finished converting document 4_2023-11-09 in 0.03 sec.


Converted 'data\edgar_documents\QCOM\4_2023-10-02' --> 'data\processed_data\QCOM\4_2023-10-02.md'
Converted 'data\edgar_documents\QCOM\4_2023-10-11' --> 'data\processed_data\QCOM\4_2023-10-11.md'
Converted 'data\edgar_documents\QCOM\4_2023-11-02' --> 'data\processed_data\QCOM\4_2023-11-02.md'


2025-11-14 17:31:13,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,342 - INFO - Going to convert document batch...
2025-11-14 17:31:13,344 - INFO - Processing document 4_2023-11-13
2025-11-14 17:31:13,363 - INFO - Finished converting document 4_2023-11-13 in 0.03 sec.
2025-11-14 17:31:13,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,439 - INFO - Going to convert document batch...
2025-11-14 17:31:13,440 - INFO - Processing document 4_2023-11-21
2025-11-14 17:31:13,466 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 17:31:13,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,509 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\QCOM\4_2023-11-09' --> 'data\processed_data\QCOM\4_2023-11-09.md'
Converted 'data\edgar_documents\QCOM\4_2023-11-13' --> 'data\processed_data\QCOM\4_2023-11-13.md'
Converted 'data\edgar_documents\QCOM\4_2023-11-21' --> 'data\processed_data\QCOM\4_2023-11-21.md'


2025-11-14 17:31:13,510 - INFO - Processing document 4_2023-11-29
2025-11-14 17:31:13,530 - INFO - Finished converting document 4_2023-11-29 in 0.05 sec.
2025-11-14 17:31:13,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,572 - INFO - Going to convert document batch...
2025-11-14 17:31:13,573 - INFO - Processing document 4_2023-12-05
2025-11-14 17:31:13,592 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 17:31:13,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,653 - INFO - Going to convert document batch...
2025-11-14 17:31:13,654 - INFO - Processing document 4_2023-12-12
2025-11-14 17:31:13,672 - INFO - Finished converting document 4_2023-12-12 in 0.06 sec.
2025-11-14 17:31:13,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,712 - INFO - Going to convert document batch...
2025-11-14 17:31:13,713 - INFO - Processing document 4_2023-12-15
2025-11-14 17:31:13,737 - IN

Converted 'data\edgar_documents\QCOM\4_2023-11-29' --> 'data\processed_data\QCOM\4_2023-11-29.md'
Converted 'data\edgar_documents\QCOM\4_2023-12-05' --> 'data\processed_data\QCOM\4_2023-12-05.md'
Converted 'data\edgar_documents\QCOM\4_2023-12-12' --> 'data\processed_data\QCOM\4_2023-12-12.md'


2025-11-14 17:31:13,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,782 - INFO - Going to convert document batch...
2025-11-14 17:31:13,783 - INFO - Processing document 4_2023-12-18
2025-11-14 17:31:13,804 - INFO - Finished converting document 4_2023-12-18 in 0.03 sec.
2025-11-14 17:31:13,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,866 - INFO - Going to convert document batch...
2025-11-14 17:31:13,867 - INFO - Processing document 4_2024-01-03
2025-11-14 17:31:13,899 - INFO - Finished converting document 4_2024-01-03 in 0.06 sec.
2025-11-14 17:31:13,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:13,942 - INFO - Going to convert document batch...
2025-11-14 17:31:13,942 - INFO - Processing document 4_2024-01-11
2025-11-14 17:31:13,961 - INFO - Finished converting document 4_2024-01-11 in 0.03 sec.


Converted 'data\edgar_documents\QCOM\4_2023-12-15' --> 'data\processed_data\QCOM\4_2023-12-15.md'
Converted 'data\edgar_documents\QCOM\4_2023-12-18' --> 'data\processed_data\QCOM\4_2023-12-18.md'
Converted 'data\edgar_documents\QCOM\4_2024-01-03' --> 'data\processed_data\QCOM\4_2024-01-03.md'


2025-11-14 17:31:13,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,000 - INFO - Going to convert document batch...
2025-11-14 17:31:14,001 - INFO - Processing document 4_2024-01-19
2025-11-14 17:31:14,020 - INFO - Finished converting document 4_2024-01-19 in 0.03 sec.
2025-11-14 17:31:14,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,060 - INFO - Going to convert document batch...
2025-11-14 17:31:14,061 - INFO - Processing document 4_2024-01-23
2025-11-14 17:31:14,079 - INFO - Finished converting document 4_2024-01-23 in 0.05 sec.
2025-11-14 17:31:14,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,122 - INFO - Going to convert document batch...
2025-11-14 17:31:14,122 - INFO - Processing document 4_2024-02-21
2025-11-14 17:31:14,149 - INFO - Finished converting document 4_2024-02-21 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2024-01-11' --> 'data\processed_data\QCOM\4_2024-01-11.md'
Converted 'data\edgar_documents\QCOM\4_2024-01-19' --> 'data\processed_data\QCOM\4_2024-01-19.md'
Converted 'data\edgar_documents\QCOM\4_2024-01-23' --> 'data\processed_data\QCOM\4_2024-01-23.md'


2025-11-14 17:31:14,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\4_2024-02-21' --> 'data\processed_data\QCOM\4_2024-02-21.md'


2025-11-14 17:31:14,475 - INFO - Going to convert document batch...
2025-11-14 17:31:14,476 - INFO - Processing document 4_2024-03-01
2025-11-14 17:31:14,497 - INFO - Finished converting document 4_2024-03-01 in 0.33 sec.
2025-11-14 17:31:14,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,546 - INFO - Going to convert document batch...
2025-11-14 17:31:14,546 - INFO - Processing document 4_2024-03-05
2025-11-14 17:31:14,566 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:31:14,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,606 - INFO - Going to convert document batch...
2025-11-14 17:31:14,607 - INFO - Processing document 4_2024-03-07
2025-11-14 17:31:14,625 - INFO - Finished converting document 4_2024-03-07 in 0.05 sec.
2025-11-14 17:31:14,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,666 - INFO - Going to convert document batch...
2025-11-14 17:31:14,667 - 

Converted 'data\edgar_documents\QCOM\4_2024-03-01' --> 'data\processed_data\QCOM\4_2024-03-01.md'
Converted 'data\edgar_documents\QCOM\4_2024-03-05' --> 'data\processed_data\QCOM\4_2024-03-05.md'
Converted 'data\edgar_documents\QCOM\4_2024-03-07' --> 'data\processed_data\QCOM\4_2024-03-07.md'
Converted 'data\edgar_documents\QCOM\4_2024-03-08' --> 'data\processed_data\QCOM\4_2024-03-08.md'


2025-11-14 17:31:14,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,749 - INFO - Going to convert document batch...
2025-11-14 17:31:14,750 - INFO - Processing document 4_2024-03-11
2025-11-14 17:31:14,770 - INFO - Finished converting document 4_2024-03-11 in 0.05 sec.
2025-11-14 17:31:14,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,823 - INFO - Going to convert document batch...
2025-11-14 17:31:14,824 - INFO - Processing document 4_2024-04-01
2025-11-14 17:31:14,842 - INFO - Finished converting document 4_2024-04-01 in 0.05 sec.
2025-11-14 17:31:14,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:14,881 - INFO - Going to convert document batch...
2025-11-14 17:31:14,882 - INFO - Processing document 4_2024-04-02
2025-11-14 17:31:14,904 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 17:31:14,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\QCOM\4_2024-03-11' --> 'data\processed_data\QCOM\4_2024-03-11.md'
Converted 'data\edgar_documents\QCOM\4_2024-04-01' --> 'data\processed_data\QCOM\4_2024-04-01.md'
Converted 'data\edgar_documents\QCOM\4_2024-04-02' --> 'data\processed_data\QCOM\4_2024-04-02.md'
Converted 'data\edgar_documents\QCOM\4_2024-04-04' --> 'data\processed_data\QCOM\4_2024-04-04.md'


2025-11-14 17:31:15,012 - INFO - Going to convert document batch...
2025-11-14 17:31:15,013 - INFO - Processing document 4_2024-05-03
2025-11-14 17:31:15,034 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.
2025-11-14 17:31:15,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,079 - INFO - Going to convert document batch...
2025-11-14 17:31:15,080 - INFO - Processing document 4_2024-05-06
2025-11-14 17:31:15,098 - INFO - Finished converting document 4_2024-05-06 in 0.03 sec.
2025-11-14 17:31:15,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,137 - INFO - Going to convert document batch...
2025-11-14 17:31:15,139 - INFO - Processing document 4_2024-05-10
2025-11-14 17:31:15,157 - INFO - Finished converting document 4_2024-05-10 in 0.05 sec.
2025-11-14 17:31:15,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,195 - INFO - Going to convert document batch...
2025-11-14 17:31:15,196 - 

Converted 'data\edgar_documents\QCOM\4_2024-05-03' --> 'data\processed_data\QCOM\4_2024-05-03.md'
Converted 'data\edgar_documents\QCOM\4_2024-05-06' --> 'data\processed_data\QCOM\4_2024-05-06.md'
Converted 'data\edgar_documents\QCOM\4_2024-05-10' --> 'data\processed_data\QCOM\4_2024-05-10.md'
Converted 'data\edgar_documents\QCOM\4_2024-05-13' --> 'data\processed_data\QCOM\4_2024-05-13.md'


2025-11-14 17:31:15,253 - INFO - Processing document 4_2024-05-16
2025-11-14 17:31:15,271 - INFO - Finished converting document 4_2024-05-16 in 0.03 sec.
2025-11-14 17:31:15,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,313 - INFO - Going to convert document batch...
2025-11-14 17:31:15,314 - INFO - Processing document 4_2024-05-21
2025-11-14 17:31:15,334 - INFO - Finished converting document 4_2024-05-21 in 0.03 sec.
2025-11-14 17:31:15,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,379 - INFO - Going to convert document batch...
2025-11-14 17:31:15,380 - INFO - Processing document 4_2024-05-22
2025-11-14 17:31:15,409 - INFO - Finished converting document 4_2024-05-22 in 0.05 sec.
2025-11-14 17:31:15,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,477 - INFO - Going to convert document batch...
2025-11-14 17:31:15,478 - INFO - Processing document 4_2024-06-04
2025-11-14 17:31:15,498 - IN

Converted 'data\edgar_documents\QCOM\4_2024-05-16' --> 'data\processed_data\QCOM\4_2024-05-16.md'
Converted 'data\edgar_documents\QCOM\4_2024-05-21' --> 'data\processed_data\QCOM\4_2024-05-21.md'
Converted 'data\edgar_documents\QCOM\4_2024-05-22' --> 'data\processed_data\QCOM\4_2024-05-22.md'


2025-11-14 17:31:15,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,540 - INFO - Going to convert document batch...
2025-11-14 17:31:15,540 - INFO - Processing document 4_2024-07-01
2025-11-14 17:31:15,562 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 17:31:15,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,605 - INFO - Going to convert document batch...
2025-11-14 17:31:15,606 - INFO - Processing document 4_2024-07-02
2025-11-14 17:31:15,625 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 17:31:15,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\4_2024-06-04' --> 'data\processed_data\QCOM\4_2024-06-04.md'
Converted 'data\edgar_documents\QCOM\4_2024-07-01' --> 'data\processed_data\QCOM\4_2024-07-01.md'
Converted 'data\edgar_documents\QCOM\4_2024-07-02' --> 'data\processed_data\QCOM\4_2024-07-02.md'


2025-11-14 17:31:15,707 - INFO - Going to convert document batch...
2025-11-14 17:31:15,707 - INFO - Processing document 4_2024-07-08
2025-11-14 17:31:15,728 - INFO - Finished converting document 4_2024-07-08 in 0.05 sec.
2025-11-14 17:31:15,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,772 - INFO - Going to convert document batch...
2025-11-14 17:31:15,773 - INFO - Processing document 4_2024-08-05
2025-11-14 17:31:15,795 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 17:31:15,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,838 - INFO - Going to convert document batch...
2025-11-14 17:31:15,839 - INFO - Processing document 4_2024-08-09
2025-11-14 17:31:15,865 - INFO - Finished converting document 4_2024-08-09 in 0.05 sec.
2025-11-14 17:31:15,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,912 - INFO - Going to convert document batch...
2025-11-14 17:31:15,913 - 

Converted 'data\edgar_documents\QCOM\4_2024-07-08' --> 'data\processed_data\QCOM\4_2024-07-08.md'
Converted 'data\edgar_documents\QCOM\4_2024-08-05' --> 'data\processed_data\QCOM\4_2024-08-05.md'
Converted 'data\edgar_documents\QCOM\4_2024-08-09' --> 'data\processed_data\QCOM\4_2024-08-09.md'


2025-11-14 17:31:15,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:15,984 - INFO - Going to convert document batch...
2025-11-14 17:31:15,985 - INFO - Processing document 4_2024-09-04
2025-11-14 17:31:16,014 - INFO - Finished converting document 4_2024-09-04 in 0.06 sec.
2025-11-14 17:31:16,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,062 - INFO - Going to convert document batch...
2025-11-14 17:31:16,063 - INFO - Processing document 4_2024-09-06
2025-11-14 17:31:16,080 - INFO - Finished converting document 4_2024-09-06 in 0.03 sec.
2025-11-14 17:31:16,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,119 - INFO - Going to convert document batch...
2025-11-14 17:31:16,120 - INFO - Processing document 4_2024-10-01
2025-11-14 17:31:16,137 - INFO - Finished converting document 4_2024-10-01 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2024-08-21' --> 'data\processed_data\QCOM\4_2024-08-21.md'
Converted 'data\edgar_documents\QCOM\4_2024-09-04' --> 'data\processed_data\QCOM\4_2024-09-04.md'
Converted 'data\edgar_documents\QCOM\4_2024-09-06' --> 'data\processed_data\QCOM\4_2024-09-06.md'


2025-11-14 17:31:16,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,181 - INFO - Going to convert document batch...
2025-11-14 17:31:16,182 - INFO - Processing document 4_2024-10-02
2025-11-14 17:31:16,208 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:31:16,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,254 - INFO - Going to convert document batch...
2025-11-14 17:31:16,255 - INFO - Processing document 4_2024-10-09
2025-11-14 17:31:16,277 - INFO - Finished converting document 4_2024-10-09 in 0.05 sec.
2025-11-14 17:31:16,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,317 - INFO - Going to convert document batch...
2025-11-14 17:31:16,318 - INFO - Processing document 4_2024-10-10
2025-11-14 17:31:16,337 - INFO - Finished converting document 4_2024-10-10 in 0.03 sec.


Converted 'data\edgar_documents\QCOM\4_2024-10-01' --> 'data\processed_data\QCOM\4_2024-10-01.md'
Converted 'data\edgar_documents\QCOM\4_2024-10-02' --> 'data\processed_data\QCOM\4_2024-10-02.md'
Converted 'data\edgar_documents\QCOM\4_2024-10-09' --> 'data\processed_data\QCOM\4_2024-10-09.md'


2025-11-14 17:31:16,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,379 - INFO - Going to convert document batch...
2025-11-14 17:31:16,380 - INFO - Processing document 4_2024-11-04
2025-11-14 17:31:16,405 - INFO - Finished converting document 4_2024-11-04 in 0.05 sec.
2025-11-14 17:31:16,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,471 - INFO - Going to convert document batch...
2025-11-14 17:31:16,472 - INFO - Processing document 4_2024-11-12
2025-11-14 17:31:16,497 - INFO - Finished converting document 4_2024-11-12 in 0.06 sec.
2025-11-14 17:31:16,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,540 - INFO - Going to convert document batch...
2025-11-14 17:31:16,540 - INFO - Processing document 4_2024-11-15


Converted 'data\edgar_documents\QCOM\4_2024-10-10' --> 'data\processed_data\QCOM\4_2024-10-10.md'
Converted 'data\edgar_documents\QCOM\4_2024-11-04' --> 'data\processed_data\QCOM\4_2024-11-04.md'
Converted 'data\edgar_documents\QCOM\4_2024-11-12' --> 'data\processed_data\QCOM\4_2024-11-12.md'


2025-11-14 17:31:16,560 - INFO - Finished converting document 4_2024-11-15 in 0.05 sec.
2025-11-14 17:31:16,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,609 - INFO - Going to convert document batch...
2025-11-14 17:31:16,610 - INFO - Processing document 4_2024-11-21
2025-11-14 17:31:16,640 - INFO - Finished converting document 4_2024-11-21 in 0.06 sec.
2025-11-14 17:31:16,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,688 - INFO - Going to convert document batch...
2025-11-14 17:31:16,689 - INFO - Processing document 4_2024-12-06
2025-11-14 17:31:16,713 - INFO - Finished converting document 4_2024-12-06 in 0.05 sec.
2025-11-14 17:31:16,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,757 - INFO - Going to convert document batch...
2025-11-14 17:31:16,758 - INFO - Processing document 4_2024-12-10
2025-11-14 17:31:16,781 - INFO - Finished converting document 4_2024-12-10 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2024-11-15' --> 'data\processed_data\QCOM\4_2024-11-15.md'
Converted 'data\edgar_documents\QCOM\4_2024-11-21' --> 'data\processed_data\QCOM\4_2024-11-21.md'
Converted 'data\edgar_documents\QCOM\4_2024-12-06' --> 'data\processed_data\QCOM\4_2024-12-06.md'


2025-11-14 17:31:16,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,821 - INFO - Going to convert document batch...
2025-11-14 17:31:16,822 - INFO - Processing document 4_2024-12-11
2025-11-14 17:31:16,846 - INFO - Finished converting document 4_2024-12-11 in 0.05 sec.
2025-11-14 17:31:16,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:16,896 - INFO - Going to convert document batch...
2025-11-14 17:31:16,897 - INFO - Processing document 4_2024-12-16
2025-11-14 17:31:16,953 - INFO - Finished converting document 4_2024-12-16 in 0.08 sec.


Converted 'data\edgar_documents\QCOM\4_2024-12-10' --> 'data\processed_data\QCOM\4_2024-12-10.md'
Converted 'data\edgar_documents\QCOM\4_2024-12-11' --> 'data\processed_data\QCOM\4_2024-12-11.md'
Converted 'data\edgar_documents\QCOM\4_2024-12-16' --> 'data\processed_data\QCOM\4_2024-12-16.md'


2025-11-14 17:31:16,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,003 - INFO - Going to convert document batch...
2025-11-14 17:31:17,003 - INFO - Processing document 4_2025-01-02
2025-11-14 17:31:17,021 - INFO - Finished converting document 4_2025-01-02 in 0.03 sec.
2025-11-14 17:31:17,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,067 - INFO - Going to convert document batch...
2025-11-14 17:31:17,067 - INFO - Processing document 4_2025-01-03
2025-11-14 17:31:17,092 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:31:17,124 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,132 - INFO - Going to convert document batch...
2025-11-14 17:31:17,133 - INFO - Processing document 4_2025-02-10
2025-11-14 17:31:17,152 - INFO - Finished converting document 4_2025-02-10 in 0.05 sec.
2025-11-14 17:31:17,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\QCOM\4_2025-01-02' --> 'data\processed_data\QCOM\4_2025-01-02.md'
Converted 'data\edgar_documents\QCOM\4_2025-01-03' --> 'data\processed_data\QCOM\4_2025-01-03.md'
Converted 'data\edgar_documents\QCOM\4_2025-02-10' --> 'data\processed_data\QCOM\4_2025-02-10.md'
Converted 'data\edgar_documents\QCOM\4_2025-02-12' --> 'data\processed_data\QCOM\4_2025-02-12.md'


2025-11-14 17:31:17,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,256 - INFO - Going to convert document batch...
2025-11-14 17:31:17,256 - INFO - Processing document 4_2025-02-21
2025-11-14 17:31:17,280 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 17:31:17,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,327 - INFO - Going to convert document batch...
2025-11-14 17:31:17,327 - INFO - Processing document 4_2025-03-03
2025-11-14 17:31:17,355 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.
2025-11-14 17:31:17,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,400 - INFO - Going to convert document batch...
2025-11-14 17:31:17,401 - INFO - Processing document 4_2025-03-10
2025-11-14 17:31:17,427 - INFO - Finished converting document 4_2025-03-10 in 0.05 sec.
2025-11-14 17:31:17,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\QCOM\4_2025-02-21' --> 'data\processed_data\QCOM\4_2025-02-21.md'
Converted 'data\edgar_documents\QCOM\4_2025-03-03' --> 'data\processed_data\QCOM\4_2025-03-03.md'
Converted 'data\edgar_documents\QCOM\4_2025-03-10' --> 'data\processed_data\QCOM\4_2025-03-10.md'


2025-11-14 17:31:17,490 - INFO - Processing document 4_2025-03-12
2025-11-14 17:31:17,510 - INFO - Finished converting document 4_2025-03-12 in 0.08 sec.
2025-11-14 17:31:17,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,553 - INFO - Going to convert document batch...
2025-11-14 17:31:17,553 - INFO - Processing document 4_2025-03-20
2025-11-14 17:31:17,574 - INFO - Finished converting document 4_2025-03-20 in 0.05 sec.
2025-11-14 17:31:17,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,614 - INFO - Going to convert document batch...
2025-11-14 17:31:17,614 - INFO - Processing document 4_2025-04-01
2025-11-14 17:31:17,633 - INFO - Finished converting document 4_2025-04-01 in 0.03 sec.
2025-11-14 17:31:17,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,672 - INFO - Going to convert document batch...
2025-11-14 17:31:17,673 - INFO - Processing document 4_2025-04-07
2025-11-14 17:31:17,693 - IN

Converted 'data\edgar_documents\QCOM\4_2025-03-12' --> 'data\processed_data\QCOM\4_2025-03-12.md'
Converted 'data\edgar_documents\QCOM\4_2025-03-20' --> 'data\processed_data\QCOM\4_2025-03-20.md'
Converted 'data\edgar_documents\QCOM\4_2025-04-01' --> 'data\processed_data\QCOM\4_2025-04-01.md'


2025-11-14 17:31:17,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,736 - INFO - Going to convert document batch...
2025-11-14 17:31:17,737 - INFO - Processing document 4_2025-04-08
2025-11-14 17:31:17,764 - INFO - Finished converting document 4_2025-04-08 in 0.05 sec.
2025-11-14 17:31:17,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,839 - INFO - Going to convert document batch...
2025-11-14 17:31:17,839 - INFO - Processing document 4_2025-04-10
2025-11-14 17:31:17,869 - INFO - Finished converting document 4_2025-04-10 in 0.08 sec.
2025-11-14 17:31:17,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\4_2025-04-07' --> 'data\processed_data\QCOM\4_2025-04-07.md'
Converted 'data\edgar_documents\QCOM\4_2025-04-08' --> 'data\processed_data\QCOM\4_2025-04-08.md'
Converted 'data\edgar_documents\QCOM\4_2025-04-10' --> 'data\processed_data\QCOM\4_2025-04-10.md'


2025-11-14 17:31:17,916 - INFO - Going to convert document batch...
2025-11-14 17:31:17,917 - INFO - Processing document 4_2025-05-02
2025-11-14 17:31:17,935 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 17:31:17,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:17,981 - INFO - Going to convert document batch...
2025-11-14 17:31:17,982 - INFO - Processing document 4_2025-05-05
2025-11-14 17:31:18,013 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 17:31:18,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,064 - INFO - Going to convert document batch...
2025-11-14 17:31:18,064 - INFO - Processing document 4_2025-05-13
2025-11-14 17:31:18,083 - INFO - Finished converting document 4_2025-05-13 in 0.05 sec.
2025-11-14 17:31:18,154 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\QCOM\4_2025-05-02' --> 'data\processed_data\QCOM\4_2025-05-02.md'
Converted 'data\edgar_documents\QCOM\4_2025-05-05' --> 'data\processed_data\QCOM\4_2025-05-05.md'
Converted 'data\edgar_documents\QCOM\4_2025-05-13' --> 'data\processed_data\QCOM\4_2025-05-13.md'


2025-11-14 17:31:18,156 - ERROR - Input document 4_2025-05-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:18,159 - INFO - Going to convert document batch...
2025-11-14 17:31:18,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,185 - INFO - Going to convert document batch...
2025-11-14 17:31:18,186 - INFO - Processing document 4_2025-05-21


Error processing data\edgar_documents\QCOM\4_2025-05-19: File format not allowed: data\edgar_documents\QCOM\4_2025-05-19


2025-11-14 17:31:18,420 - INFO - Finished converting document 4_2025-05-21 in 0.27 sec.
2025-11-14 17:31:18,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,471 - INFO - Going to convert document batch...
2025-11-14 17:31:18,472 - INFO - Processing document 4_2025-05-28
2025-11-14 17:31:18,491 - INFO - Finished converting document 4_2025-05-28 in 0.05 sec.
2025-11-14 17:31:18,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,535 - INFO - Going to convert document batch...
2025-11-14 17:31:18,536 - INFO - Processing document 4_2025-06-02
2025-11-14 17:31:18,578 - INFO - Finished converting document 4_2025-06-02 in 0.06 sec.
2025-11-14 17:31:18,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,620 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\QCOM\4_2025-05-21' --> 'data\processed_data\QCOM\4_2025-05-21.md'
Converted 'data\edgar_documents\QCOM\4_2025-05-28' --> 'data\processed_data\QCOM\4_2025-05-28.md'
Converted 'data\edgar_documents\QCOM\4_2025-06-02' --> 'data\processed_data\QCOM\4_2025-06-02.md'


2025-11-14 17:31:18,622 - INFO - Processing document 4_2025-07-01
2025-11-14 17:31:18,644 - INFO - Finished converting document 4_2025-07-01 in 0.05 sec.
2025-11-14 17:31:18,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,690 - INFO - Going to convert document batch...
2025-11-14 17:31:18,691 - INFO - Processing document 4_2025-07-02
2025-11-14 17:31:18,715 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 17:31:18,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,756 - INFO - Going to convert document batch...
2025-11-14 17:31:18,757 - INFO - Processing document 4_2025-08-01
2025-11-14 17:31:18,777 - INFO - Finished converting document 4_2025-08-01 in 0.05 sec.
2025-11-14 17:31:18,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,823 - INFO - Going to convert document batch...
2025-11-14 17:31:18,823 - INFO - Processing document 4_2025-08-04
2025-11-14 17:31:18,846 - IN

Converted 'data\edgar_documents\QCOM\4_2025-07-01' --> 'data\processed_data\QCOM\4_2025-07-01.md'
Converted 'data\edgar_documents\QCOM\4_2025-07-02' --> 'data\processed_data\QCOM\4_2025-07-02.md'
Converted 'data\edgar_documents\QCOM\4_2025-08-01' --> 'data\processed_data\QCOM\4_2025-08-01.md'


2025-11-14 17:31:18,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,894 - INFO - Going to convert document batch...
2025-11-14 17:31:18,895 - INFO - Processing document 4_2025-08-21
2025-11-14 17:31:18,927 - INFO - Finished converting document 4_2025-08-21 in 0.06 sec.
2025-11-14 17:31:18,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:18,972 - INFO - Going to convert document batch...
2025-11-14 17:31:18,973 - INFO - Processing document 4_2025-08-27
2025-11-14 17:31:18,993 - INFO - Finished converting document 4_2025-08-27 in 0.03 sec.
2025-11-14 17:31:19,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,033 - INFO - Going to convert document batch...
2025-11-14 17:31:19,034 - INFO - Processing document 4_2025-09-02
2025-11-14 17:31:19,059 - INFO - Finished converting document 4_2025-09-02 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2025-08-04' --> 'data\processed_data\QCOM\4_2025-08-04.md'
Converted 'data\edgar_documents\QCOM\4_2025-08-21' --> 'data\processed_data\QCOM\4_2025-08-21.md'
Converted 'data\edgar_documents\QCOM\4_2025-08-27' --> 'data\processed_data\QCOM\4_2025-08-27.md'


2025-11-14 17:31:19,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,102 - INFO - Going to convert document batch...
2025-11-14 17:31:19,103 - INFO - Processing document 4_2025-09-15
2025-11-14 17:31:19,123 - INFO - Finished converting document 4_2025-09-15 in 0.05 sec.
2025-11-14 17:31:19,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,190 - INFO - Going to convert document batch...
2025-11-14 17:31:19,191 - INFO - Processing document 4_2025-09-23
2025-11-14 17:31:19,220 - INFO - Finished converting document 4_2025-09-23 in 0.08 sec.
2025-11-14 17:31:19,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\QCOM\4_2025-09-02' --> 'data\processed_data\QCOM\4_2025-09-02.md'
Converted 'data\edgar_documents\QCOM\4_2025-09-15' --> 'data\processed_data\QCOM\4_2025-09-15.md'
Converted 'data\edgar_documents\QCOM\4_2025-09-23' --> 'data\processed_data\QCOM\4_2025-09-23.md'


2025-11-14 17:31:19,280 - INFO - Going to convert document batch...
2025-11-14 17:31:19,281 - INFO - Processing document 4_2025-10-01
2025-11-14 17:31:19,300 - INFO - Finished converting document 4_2025-10-01 in 0.05 sec.
2025-11-14 17:31:19,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,344 - INFO - Going to convert document batch...
2025-11-14 17:31:19,345 - INFO - Processing document 4_2025-10-03
2025-11-14 17:31:19,368 - INFO - Finished converting document 4_2025-10-03 in 0.05 sec.
2025-11-14 17:31:19,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,435 - INFO - Going to convert document batch...
2025-11-14 17:31:19,436 - INFO - Processing document 4_2025-10-16
2025-11-14 17:31:19,461 - INFO - Finished converting document 4_2025-10-16 in 0.06 sec.


Converted 'data\edgar_documents\QCOM\4_2025-10-01' --> 'data\processed_data\QCOM\4_2025-10-01.md'
Converted 'data\edgar_documents\QCOM\4_2025-10-03' --> 'data\processed_data\QCOM\4_2025-10-03.md'
Converted 'data\edgar_documents\QCOM\4_2025-10-16' --> 'data\processed_data\QCOM\4_2025-10-16.md'


2025-11-14 17:31:19,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,510 - INFO - Going to convert document batch...
2025-11-14 17:31:19,511 - INFO - Processing document 4_2025-10-20
2025-11-14 17:31:19,536 - INFO - Finished converting document 4_2025-10-20 in 0.05 sec.
2025-11-14 17:31:19,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,583 - INFO - Going to convert document batch...
2025-11-14 17:31:19,584 - INFO - Processing document 4_2025-10-27
2025-11-14 17:31:19,602 - INFO - Finished converting document 4_2025-10-27 in 0.03 sec.
2025-11-14 17:31:19,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,641 - INFO - Going to convert document batch...
2025-11-14 17:31:19,642 - INFO - Processing document 4_2025-10-31
2025-11-14 17:31:19,661 - INFO - Finished converting document 4_2025-10-31 in 0.03 sec.
2025-11-14 17:31:19,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\QCOM\4_2025-10-20' --> 'data\processed_data\QCOM\4_2025-10-20.md'
Converted 'data\edgar_documents\QCOM\4_2025-10-27' --> 'data\processed_data\QCOM\4_2025-10-27.md'
Converted 'data\edgar_documents\QCOM\4_2025-10-31' --> 'data\processed_data\QCOM\4_2025-10-31.md'


2025-11-14 17:31:19,753 - INFO - Finished converting document 4_2025-11-10 in 0.08 sec.
2025-11-14 17:31:19,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,828 - INFO - Going to convert document batch...
2025-11-14 17:31:19,830 - INFO - Processing document 8-K_2023-02-02
2025-11-14 17:31:19,857 - INFO - Finished converting document 8-K_2023-02-02 in 0.08 sec.
2025-11-14 17:31:19,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,899 - INFO - Going to convert document batch...
2025-11-14 17:31:19,900 - INFO - Processing document 8-K_2023-03-09
2025-11-14 17:31:19,929 - INFO - Finished converting document 8-K_2023-03-09 in 0.05 sec.


Converted 'data\edgar_documents\QCOM\4_2025-11-10' --> 'data\processed_data\QCOM\4_2025-11-10.md'
Converted 'data\edgar_documents\QCOM\8-K_2023-02-02' --> 'data\processed_data\QCOM\8-K_2023-02-02.md'
Converted 'data\edgar_documents\QCOM\8-K_2023-03-09' --> 'data\processed_data\QCOM\8-K_2023-03-09.md'


2025-11-14 17:31:19,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:19,993 - INFO - Going to convert document batch...
2025-11-14 17:31:19,993 - INFO - Processing document 8-K_2023-05-03
2025-11-14 17:31:20,009 - INFO - Finished converting document 8-K_2023-05-03 in 0.06 sec.
2025-11-14 17:31:20,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,046 - INFO - Going to convert document batch...
2025-11-14 17:31:20,046 - INFO - Processing document 8-K_2023-07-21
2025-11-14 17:31:20,065 - INFO - Finished converting document 8-K_2023-07-21 in 0.05 sec.
2025-11-14 17:31:20,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,099 - INFO - Going to convert document batch...
2025-11-14 17:31:20,100 - INFO - Processing document 8-K_2023-08-02
2025-11-14 17:31:20,116 - INFO - Finished converting document 8-K_2023-08-02 in 0.03 sec.
2025-11-14 17:31:20,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\QCOM\8-K_2023-05-03' --> 'data\processed_data\QCOM\8-K_2023-05-03.md'
Converted 'data\edgar_documents\QCOM\8-K_2023-07-21' --> 'data\processed_data\QCOM\8-K_2023-07-21.md'
Converted 'data\edgar_documents\QCOM\8-K_2023-08-02' --> 'data\processed_data\QCOM\8-K_2023-08-02.md'
Converted 'data\edgar_documents\QCOM\8-K_2023-11-01' --> 'data\processed_data\QCOM\8-K_2023-11-01.md'


2025-11-14 17:31:20,198 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:31:20,211 - INFO - Finished converting document 8-K_2024-01-23 in 0.03 sec.
2025-11-14 17:31:20,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,242 - INFO - Going to convert document batch...
2025-11-14 17:31:20,243 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:31:20,263 - INFO - Finished converting document 8-K_2024-01-31 in 0.05 sec.
2025-11-14 17:31:20,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,324 - INFO - Going to convert document batch...
2025-11-14 17:31:20,326 - INFO - Processing document 8-K_2024-03-07
2025-11-14 17:31:20,391 - INFO - Finished converting document 8-K_2024-03-07 in 0.12 sec.


Converted 'data\edgar_documents\QCOM\8-K_2024-01-23' --> 'data\processed_data\QCOM\8-K_2024-01-23.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-01-31' --> 'data\processed_data\QCOM\8-K_2024-01-31.md'


2025-11-14 17:31:20,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,441 - INFO - Going to convert document batch...
2025-11-14 17:31:20,442 - INFO - Processing document 8-K_2024-05-01
2025-11-14 17:31:20,460 - INFO - Finished converting document 8-K_2024-05-01 in 0.03 sec.
2025-11-14 17:31:20,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,493 - INFO - Going to convert document batch...
2025-11-14 17:31:20,493 - INFO - Processing document 8-K_2024-05-09
2025-11-14 17:31:20,511 - INFO - Finished converting document 8-K_2024-05-09 in 0.05 sec.
2025-11-14 17:31:20,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,544 - INFO - Going to convert document batch...
2025-11-14 17:31:20,544 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:31:20,563 - INFO - Finished converting document 8-K_2024-07-31 in 0.05 sec.
2025-11-14 17:31:20,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\QCOM\8-K_2024-03-07' --> 'data\processed_data\QCOM\8-K_2024-03-07.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-05-01' --> 'data\processed_data\QCOM\8-K_2024-05-01.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-05-09' --> 'data\processed_data\QCOM\8-K_2024-05-09.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-07-31' --> 'data\processed_data\QCOM\8-K_2024-07-31.md'


2025-11-14 17:31:20,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,648 - INFO - Going to convert document batch...
2025-11-14 17:31:20,649 - INFO - Processing document 8-K_2024-10-09
2025-11-14 17:31:20,667 - INFO - Finished converting document 8-K_2024-10-09 in 0.05 sec.
2025-11-14 17:31:20,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,698 - INFO - Going to convert document batch...
2025-11-14 17:31:20,699 - INFO - Processing document 8-K_2024-11-06
2025-11-14 17:31:20,717 - INFO - Finished converting document 8-K_2024-11-06 in 0.05 sec.
2025-11-14 17:31:20,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,763 - INFO - Going to convert document batch...
2025-11-14 17:31:20,764 - INFO - Processing document 8-K_2024-12-12
2025-11-14 17:31:20,780 - INFO - Finished converting document 8-K_2024-12-12 in 0.06 sec.
2025-11-14 17:31:20,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\QCOM\8-K_2024-08-09' --> 'data\processed_data\QCOM\8-K_2024-08-09.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-10-09' --> 'data\processed_data\QCOM\8-K_2024-10-09.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-11-06' --> 'data\processed_data\QCOM\8-K_2024-11-06.md'
Converted 'data\edgar_documents\QCOM\8-K_2024-12-12' --> 'data\processed_data\QCOM\8-K_2024-12-12.md'


2025-11-14 17:31:20,809 - INFO - Processing document 8-K_2025-02-05
2025-11-14 17:31:20,827 - INFO - Finished converting document 8-K_2025-02-05 in 0.05 sec.
2025-11-14 17:31:20,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,866 - INFO - Going to convert document batch...
2025-11-14 17:31:20,868 - INFO - Processing document 8-K_2025-03-20
2025-11-14 17:31:20,898 - INFO - Finished converting document 8-K_2025-03-20 in 0.06 sec.
2025-11-14 17:31:20,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,937 - INFO - Going to convert document batch...
2025-11-14 17:31:20,938 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:31:20,960 - INFO - Finished converting document 8-K_2025-04-30 in 0.05 sec.
2025-11-14 17:31:20,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:20,993 - INFO - Going to convert document batch...
2025-11-14 17:31:20,994 - INFO - Processing document 8-K_2025-05-13
2025-11-14 17:

Converted 'data\edgar_documents\QCOM\8-K_2025-02-05' --> 'data\processed_data\QCOM\8-K_2025-02-05.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-03-20' --> 'data\processed_data\QCOM\8-K_2025-03-20.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-04-30' --> 'data\processed_data\QCOM\8-K_2025-04-30.md'


2025-11-14 17:31:21,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:21,055 - INFO - Going to convert document batch...
2025-11-14 17:31:21,056 - INFO - Processing document 8-K_2025-05-22
2025-11-14 17:31:21,092 - INFO - Finished converting document 8-K_2025-05-22 in 0.06 sec.
2025-11-14 17:31:21,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:21,181 - INFO - Going to convert document batch...
2025-11-14 17:31:21,182 - INFO - Processing document 8-K_2025-06-09
2025-11-14 17:31:21,201 - INFO - Finished converting document 8-K_2025-06-09 in 0.06 sec.


Converted 'data\edgar_documents\QCOM\8-K_2025-05-13' --> 'data\processed_data\QCOM\8-K_2025-05-13.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-05-22' --> 'data\processed_data\QCOM\8-K_2025-05-22.md'


2025-11-14 17:31:21,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:21,247 - INFO - Going to convert document batch...
2025-11-14 17:31:21,248 - INFO - Processing document 8-K_2025-07-30
2025-11-14 17:31:21,268 - INFO - Finished converting document 8-K_2025-07-30 in 0.05 sec.
2025-11-14 17:31:21,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:21,303 - INFO - Going to convert document batch...
2025-11-14 17:31:21,303 - INFO - Processing document 8-K_2025-08-25
2025-11-14 17:31:21,320 - INFO - Finished converting document 8-K_2025-08-25 in 0.03 sec.
2025-11-14 17:31:21,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:21,351 - INFO - Going to convert document batch...
2025-11-14 17:31:21,351 - INFO - Processing document 8-K_2025-09-02
2025-11-14 17:31:21,370 - INFO - Finished converting document 8-K_2025-09-02 in 0.05 sec.
2025-11-14 17:31:21,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\QCOM\8-K_2025-06-09' --> 'data\processed_data\QCOM\8-K_2025-06-09.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-07-30' --> 'data\processed_data\QCOM\8-K_2025-07-30.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-08-25' --> 'data\processed_data\QCOM\8-K_2025-08-25.md'
Converted 'data\edgar_documents\QCOM\8-K_2025-09-02' --> 'data\processed_data\QCOM\8-K_2025-09-02.md'


2025-11-14 17:31:21,402 - INFO - Processing document 8-K_2025-11-05
2025-11-14 17:31:21,421 - INFO - Finished converting document 8-K_2025-11-05 in 0.05 sec.
2025-11-14 17:31:21,508 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:21,509 - ERROR - Input document DEF-14A_2023-01-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:21,514 - INFO - Going to convert document batch...
2025-11-14 17:31:21,581 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>

Converted 'data\edgar_documents\QCOM\8-K_2025-11-05' --> 'data\processed_data\QCOM\8-K_2025-11-05.md'
Error processing data\edgar_documents\QCOM\DEF-14A_2023-01-19: File format not allowed: data\edgar_documents\QCOM\DEF-14A_2023-01-19
Error processing data\edgar_documents\QCOM\DEF-14A_2024-01-18: File format not allowed: data\edgar_documents\QCOM\DEF-14A_2024-01-18


2025-11-14 17:31:21,646 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:21,646 - ERROR - Input document DEF-14A_2025-01-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:21,649 - INFO - Going to convert document batch...
2025-11-14 17:31:21,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\QCOM\DEF-14A_2025-01-23: File format not allowed: data\edgar_documents\QCOM\DEF-14A_2025-01-23
Processed 138 new files. Errors: 5
Found 99 files to process in data\edgar_documents\RTX


2025-11-14 17:31:22,863 - INFO - Going to convert document batch...
2025-11-14 17:31:22,864 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:31:22,864 - INFO - Processing document 10-K_2023-02-07
2025-11-14 17:31:25,478 - INFO - Finished converting document 10-K_2023-02-07 in 3.81 sec.
2025-11-14 17:31:26,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-K_2023-02-07' --> 'data\processed_data\RTX\10-K_2023-02-07.md'


2025-11-14 17:31:27,420 - INFO - Going to convert document batch...
2025-11-14 17:31:27,422 - INFO - Processing document 10-K_2024-02-05
2025-11-14 17:31:29,323 - INFO - Finished converting document 10-K_2024-02-05 in 3.06 sec.
2025-11-14 17:31:30,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-K_2024-02-05' --> 'data\processed_data\RTX\10-K_2024-02-05.md'


2025-11-14 17:31:31,393 - INFO - Going to convert document batch...
2025-11-14 17:31:31,394 - INFO - Processing document 10-K_2025-02-03
2025-11-14 17:31:33,291 - INFO - Finished converting document 10-K_2025-02-03 in 3.28 sec.
2025-11-14 17:31:34,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-K_2025-02-03' --> 'data\processed_data\RTX\10-K_2025-02-03.md'


2025-11-14 17:31:34,468 - INFO - Going to convert document batch...
2025-11-14 17:31:34,469 - INFO - Processing document 10-Q_2023-04-25
2025-11-14 17:31:35,274 - INFO - Finished converting document 10-Q_2023-04-25 in 1.28 sec.
2025-11-14 17:31:35,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2023-04-25' --> 'data\processed_data\RTX\10-Q_2023-04-25.md'


2025-11-14 17:31:36,709 - INFO - Going to convert document batch...
2025-11-14 17:31:36,710 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 17:31:37,819 - INFO - Finished converting document 10-Q_2023-07-25 in 2.17 sec.
2025-11-14 17:31:38,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2023-07-25' --> 'data\processed_data\RTX\10-Q_2023-07-25.md'


2025-11-14 17:31:39,261 - INFO - Going to convert document batch...
2025-11-14 17:31:39,262 - INFO - Processing document 10-Q_2023-10-24
2025-11-14 17:31:40,336 - INFO - Finished converting document 10-Q_2023-10-24 in 2.02 sec.
2025-11-14 17:31:40,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2023-10-24' --> 'data\processed_data\RTX\10-Q_2023-10-24.md'


2025-11-14 17:31:41,256 - INFO - Going to convert document batch...
2025-11-14 17:31:41,257 - INFO - Processing document 10-Q_2024-04-23
2025-11-14 17:31:42,034 - INFO - Finished converting document 10-Q_2024-04-23 in 1.19 sec.
2025-11-14 17:31:42,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2024-04-23' --> 'data\processed_data\RTX\10-Q_2024-04-23.md'


2025-11-14 17:31:43,362 - INFO - Going to convert document batch...
2025-11-14 17:31:43,363 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:31:44,377 - INFO - Finished converting document 10-Q_2024-07-25 in 2.00 sec.
2025-11-14 17:31:44,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2024-07-25' --> 'data\processed_data\RTX\10-Q_2024-07-25.md'


2025-11-14 17:31:45,711 - INFO - Going to convert document batch...
2025-11-14 17:31:45,712 - INFO - Processing document 10-Q_2024-10-22
2025-11-14 17:31:46,757 - INFO - Finished converting document 10-Q_2024-10-22 in 1.91 sec.
2025-11-14 17:31:47,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2024-10-22' --> 'data\processed_data\RTX\10-Q_2024-10-22.md'


2025-11-14 17:31:47,835 - INFO - Going to convert document batch...
2025-11-14 17:31:47,835 - INFO - Processing document 10-Q_2025-04-22
2025-11-14 17:31:49,012 - INFO - Finished converting document 10-Q_2025-04-22 in 1.66 sec.
2025-11-14 17:31:49,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2025-04-22' --> 'data\processed_data\RTX\10-Q_2025-04-22.md'


2025-11-14 17:31:49,968 - INFO - Going to convert document batch...
2025-11-14 17:31:49,969 - INFO - Processing document 10-Q_2025-07-22
2025-11-14 17:31:51,003 - INFO - Finished converting document 10-Q_2025-07-22 in 1.61 sec.
2025-11-14 17:31:51,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2025-07-22' --> 'data\processed_data\RTX\10-Q_2025-07-22.md'


2025-11-14 17:31:52,600 - INFO - Going to convert document batch...
2025-11-14 17:31:52,600 - INFO - Processing document 10-Q_2025-10-21
2025-11-14 17:31:53,639 - INFO - Finished converting document 10-Q_2025-10-21 in 2.16 sec.
2025-11-14 17:31:54,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,138 - INFO - Going to convert document batch...
2025-11-14 17:31:54,139 - INFO - Processing document 4_2023-01-18
2025-11-14 17:31:54,159 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:31:54,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,229 - INFO - Going to convert document batch...
2025-11-14 17:31:54,229 - INFO - Processing document 4_2023-01-31
2025-11-14 17:31:54,250 - INFO - Finished converting document 4_2023-01-31 in 0.06 sec.
2025-11-14 17:31:54,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\10-Q_2025-10-21' --> 'data\processed_data\RTX\10-Q_2025-10-21.md'
Converted 'data\edgar_documents\RTX\4_2023-01-18' --> 'data\processed_data\RTX\4_2023-01-18.md'
Converted 'data\edgar_documents\RTX\4_2023-01-31' --> 'data\processed_data\RTX\4_2023-01-31.md'


2025-11-14 17:31:54,314 - INFO - Going to convert document batch...
2025-11-14 17:31:54,315 - INFO - Processing document 4_2023-02-07
2025-11-14 17:31:54,336 - INFO - Finished converting document 4_2023-02-07 in 0.06 sec.
2025-11-14 17:31:54,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,376 - INFO - Going to convert document batch...
2025-11-14 17:31:54,376 - INFO - Processing document 4_2023-02-10
2025-11-14 17:31:54,409 - INFO - Finished converting document 4_2023-02-10 in 0.05 sec.
2025-11-14 17:31:54,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,459 - INFO - Going to convert document batch...
2025-11-14 17:31:54,460 - INFO - Processing document 4_2023-02-16
2025-11-14 17:31:54,485 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 17:31:54,528 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:54,528 - ERROR - Input document 4_2023-02-23 with format None does 

Converted 'data\edgar_documents\RTX\4_2023-02-07' --> 'data\processed_data\RTX\4_2023-02-07.md'
Converted 'data\edgar_documents\RTX\4_2023-02-10' --> 'data\processed_data\RTX\4_2023-02-10.md'
Converted 'data\edgar_documents\RTX\4_2023-02-16' --> 'data\processed_data\RTX\4_2023-02-16.md'
Error processing data\edgar_documents\RTX\4_2023-02-23: File format not allowed: data\edgar_documents\RTX\4_2023-02-23


2025-11-14 17:31:54,553 - ERROR - Input document 4_2023-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:54,554 - INFO - Going to convert document batch...
2025-11-14 17:31:54,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,575 - INFO - Going to convert document batch...
2025-11-14 17:31:54,575 - INFO - Processing document 4_2023-03-02
2025-11-14 17:31:54,593 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 17:31:54,662 - INFO - detec

Error processing data\edgar_documents\RTX\4_2023-02-27: File format not allowed: data\edgar_documents\RTX\4_2023-02-27
Converted 'data\edgar_documents\RTX\4_2023-03-02' --> 'data\processed_data\RTX\4_2023-03-02.md'
Converted 'data\edgar_documents\RTX\4_2023-03-22' --> 'data\processed_data\RTX\4_2023-03-22.md'


2025-11-14 17:31:54,741 - INFO - Going to convert document batch...
2025-11-14 17:31:54,741 - INFO - Processing document 4_2023-03-28
2025-11-14 17:31:54,762 - INFO - Finished converting document 4_2023-03-28 in 0.05 sec.
2025-11-14 17:31:54,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,811 - INFO - Going to convert document batch...
2025-11-14 17:31:54,813 - INFO - Processing document 4_2023-05-04
2025-11-14 17:31:54,835 - INFO - Finished converting document 4_2023-05-04 in 0.05 sec.
2025-11-14 17:31:54,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,880 - INFO - Going to convert document batch...
2025-11-14 17:31:54,882 - INFO - Processing document 4_2023-07-27
2025-11-14 17:31:54,901 - INFO - Finished converting document 4_2023-07-27 in 0.05 sec.
2025-11-14 17:31:54,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:54,942 - INFO - Going to convert document batch...
2025-11-14 17:31:54,943 - 

Converted 'data\edgar_documents\RTX\4_2023-03-28' --> 'data\processed_data\RTX\4_2023-03-28.md'
Converted 'data\edgar_documents\RTX\4_2023-05-04' --> 'data\processed_data\RTX\4_2023-05-04.md'
Converted 'data\edgar_documents\RTX\4_2023-07-27' --> 'data\processed_data\RTX\4_2023-07-27.md'


2025-11-14 17:31:55,018 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:55,019 - ERROR - Input document 4_2023-11-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:55,021 - INFO - Going to convert document batch...
2025-11-14 17:31:55,051 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:55,052 - ERROR - Input document 4_2023-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\RTX\4_2023-10-04' --> 'data\processed_data\RTX\4_2023-10-04.md'
Error processing data\edgar_documents\RTX\4_2023-11-06: File format not allowed: data\edgar_documents\RTX\4_2023-11-06
Error processing data\edgar_documents\RTX\4_2023-11-08: File format not allowed: data\edgar_documents\RTX\4_2023-11-08
Converted 'data\edgar_documents\RTX\4_2023-12-18' --> 'data\processed_data\RTX\4_2023-12-18.md'


2025-11-14 17:31:55,173 - INFO - Processing document 4_2024-01-04
2025-11-14 17:31:55,192 - INFO - Finished converting document 4_2024-01-04 in 0.03 sec.
2025-11-14 17:31:55,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,237 - INFO - Going to convert document batch...
2025-11-14 17:31:55,238 - INFO - Processing document 4_2024-02-08
2025-11-14 17:31:55,265 - INFO - Finished converting document 4_2024-02-08 in 0.05 sec.
2025-11-14 17:31:55,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,314 - INFO - Going to convert document batch...
2025-11-14 17:31:55,315 - INFO - Processing document 4_2024-02-12
2025-11-14 17:31:55,349 - INFO - Finished converting document 4_2024-02-12 in 0.06 sec.
2025-11-14 17:31:55,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,399 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\RTX\4_2024-01-04' --> 'data\processed_data\RTX\4_2024-01-04.md'
Converted 'data\edgar_documents\RTX\4_2024-02-08' --> 'data\processed_data\RTX\4_2024-02-08.md'
Converted 'data\edgar_documents\RTX\4_2024-02-12' --> 'data\processed_data\RTX\4_2024-02-12.md'


2025-11-14 17:31:55,401 - INFO - Processing document 4_2024-02-15
2025-11-14 17:31:55,425 - INFO - Finished converting document 4_2024-02-15 in 0.05 sec.
2025-11-14 17:31:55,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,483 - INFO - Going to convert document batch...
2025-11-14 17:31:55,483 - INFO - Processing document 4_2024-02-20
2025-11-14 17:31:55,515 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 17:31:55,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,604 - INFO - Going to convert document batch...
2025-11-14 17:31:55,605 - INFO - Processing document 4_2024-03-12
2025-11-14 17:31:55,644 - INFO - Finished converting document 4_2024-03-12 in 0.09 sec.


Converted 'data\edgar_documents\RTX\4_2024-02-15' --> 'data\processed_data\RTX\4_2024-02-15.md'
Converted 'data\edgar_documents\RTX\4_2024-02-20' --> 'data\processed_data\RTX\4_2024-02-20.md'


2025-11-14 17:31:55,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,689 - INFO - Going to convert document batch...
2025-11-14 17:31:55,690 - INFO - Processing document 4_2024-03-27
2025-11-14 17:31:55,714 - INFO - Finished converting document 4_2024-03-27 in 0.05 sec.
2025-11-14 17:31:55,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,785 - INFO - Going to convert document batch...
2025-11-14 17:31:55,785 - INFO - Processing document 4_2024-04-29
2025-11-14 17:31:55,824 - INFO - Finished converting document 4_2024-04-29 in 0.09 sec.
2025-11-14 17:31:55,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2024-03-12' --> 'data\processed_data\RTX\4_2024-03-12.md'
Converted 'data\edgar_documents\RTX\4_2024-03-27' --> 'data\processed_data\RTX\4_2024-03-27.md'
Converted 'data\edgar_documents\RTX\4_2024-04-29' --> 'data\processed_data\RTX\4_2024-04-29.md'


2025-11-14 17:31:55,876 - INFO - Going to convert document batch...
2025-11-14 17:31:55,877 - INFO - Processing document 4_2024-04-30
2025-11-14 17:31:55,901 - INFO - Finished converting document 4_2024-04-30 in 0.06 sec.
2025-11-14 17:31:55,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:55,950 - INFO - Going to convert document batch...
2025-11-14 17:31:55,951 - INFO - Processing document 4_2024-05-02
2025-11-14 17:31:55,974 - INFO - Finished converting document 4_2024-05-02 in 0.05 sec.
2025-11-14 17:31:56,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,016 - INFO - Going to convert document batch...
2025-11-14 17:31:56,017 - INFO - Processing document 4_2024-05-06
2025-11-14 17:31:56,039 - INFO - Finished converting document 4_2024-05-06 in 0.03 sec.
2025-11-14 17:31:56,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,108 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\RTX\4_2024-04-30' --> 'data\processed_data\RTX\4_2024-04-30.md'
Converted 'data\edgar_documents\RTX\4_2024-05-02' --> 'data\processed_data\RTX\4_2024-05-02.md'
Converted 'data\edgar_documents\RTX\4_2024-05-06' --> 'data\processed_data\RTX\4_2024-05-06.md'


2025-11-14 17:31:56,109 - INFO - Processing document 4_2024-05-14
2025-11-14 17:31:56,145 - INFO - Finished converting document 4_2024-05-14 in 0.08 sec.
2025-11-14 17:31:56,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,201 - INFO - Going to convert document batch...
2025-11-14 17:31:56,204 - INFO - Processing document 4_2024-07-30
2025-11-14 17:31:56,235 - INFO - Finished converting document 4_2024-07-30 in 0.06 sec.
2025-11-14 17:31:56,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,284 - INFO - Going to convert document batch...
2025-11-14 17:31:56,285 - INFO - Processing document 4_2024-07-31
2025-11-14 17:31:56,310 - INFO - Finished converting document 4_2024-07-31 in 0.05 sec.
2025-11-14 17:31:56,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2024-05-14' --> 'data\processed_data\RTX\4_2024-05-14.md'
Converted 'data\edgar_documents\RTX\4_2024-07-30' --> 'data\processed_data\RTX\4_2024-07-30.md'
Converted 'data\edgar_documents\RTX\4_2024-07-31' --> 'data\processed_data\RTX\4_2024-07-31.md'


2025-11-14 17:31:56,390 - INFO - Going to convert document batch...
2025-11-14 17:31:56,391 - INFO - Processing document 4_2024-08-01
2025-11-14 17:31:56,432 - INFO - Finished converting document 4_2024-08-01 in 0.11 sec.
2025-11-14 17:31:56,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,513 - INFO - Going to convert document batch...
2025-11-14 17:31:56,515 - INFO - Processing document 4_2024-10-03
2025-11-14 17:31:56,541 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 17:31:56,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,596 - INFO - Going to convert document batch...
2025-11-14 17:31:56,597 - INFO - Processing document 4_2024-12-19
2025-11-14 17:31:56,624 - INFO - Finished converting document 4_2024-12-19 in 0.06 sec.
2025-11-14 17:31:56,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2024-08-01' --> 'data\processed_data\RTX\4_2024-08-01.md'
Converted 'data\edgar_documents\RTX\4_2024-10-03' --> 'data\processed_data\RTX\4_2024-10-03.md'
Converted 'data\edgar_documents\RTX\4_2024-12-19' --> 'data\processed_data\RTX\4_2024-12-19.md'


2025-11-14 17:31:56,683 - INFO - Going to convert document batch...
2025-11-14 17:31:56,684 - INFO - Processing document 4_2025-02-06
2025-11-14 17:31:56,709 - INFO - Finished converting document 4_2025-02-06 in 0.05 sec.
2025-11-14 17:31:56,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:56,759 - INFO - Going to convert document batch...
2025-11-14 17:31:56,759 - INFO - Processing document 4_2025-02-10
2025-11-14 17:31:56,783 - INFO - Finished converting document 4_2025-02-10 in 0.05 sec.
2025-11-14 17:31:56,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2025-02-06' --> 'data\processed_data\RTX\4_2025-02-06.md'
Converted 'data\edgar_documents\RTX\4_2025-02-10' --> 'data\processed_data\RTX\4_2025-02-10.md'


2025-11-14 17:31:57,241 - INFO - Going to convert document batch...
2025-11-14 17:31:57,242 - INFO - Processing document 4_2025-02-19
2025-11-14 17:31:57,262 - INFO - Finished converting document 4_2025-02-19 in 0.47 sec.
2025-11-14 17:31:57,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,316 - INFO - Going to convert document batch...
2025-11-14 17:31:57,318 - INFO - Processing document 4_2025-02-26
2025-11-14 17:31:57,350 - INFO - Finished converting document 4_2025-02-26 in 0.06 sec.
2025-11-14 17:31:57,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,396 - INFO - Going to convert document batch...
2025-11-14 17:31:57,397 - INFO - Processing document 4_2025-02-27
2025-11-14 17:31:57,424 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.
2025-11-14 17:31:57,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,467 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\RTX\4_2025-02-19' --> 'data\processed_data\RTX\4_2025-02-19.md'
Converted 'data\edgar_documents\RTX\4_2025-02-26' --> 'data\processed_data\RTX\4_2025-02-26.md'
Converted 'data\edgar_documents\RTX\4_2025-02-27' --> 'data\processed_data\RTX\4_2025-02-27.md'


2025-11-14 17:31:57,467 - INFO - Processing document 4_2025-03-03
2025-11-14 17:31:57,486 - INFO - Finished converting document 4_2025-03-03 in 0.03 sec.
2025-11-14 17:31:57,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,533 - INFO - Going to convert document batch...
2025-11-14 17:31:57,534 - INFO - Processing document 4_2025-04-23
2025-11-14 17:31:57,555 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 17:31:57,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,598 - INFO - Going to convert document batch...
2025-11-14 17:31:57,599 - INFO - Processing document 4_2025-05-05
2025-11-14 17:31:57,619 - INFO - Finished converting document 4_2025-05-05 in 0.03 sec.
2025-11-14 17:31:57,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,665 - INFO - Going to convert document batch...
2025-11-14 17:31:57,666 - INFO - Processing document 4_2025-05-08


Converted 'data\edgar_documents\RTX\4_2025-03-03' --> 'data\processed_data\RTX\4_2025-03-03.md'
Converted 'data\edgar_documents\RTX\4_2025-04-23' --> 'data\processed_data\RTX\4_2025-04-23.md'
Converted 'data\edgar_documents\RTX\4_2025-05-05' --> 'data\processed_data\RTX\4_2025-05-05.md'


2025-11-14 17:31:57,693 - INFO - Finished converting document 4_2025-05-08 in 0.05 sec.
2025-11-14 17:31:57,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,737 - INFO - Going to convert document batch...
2025-11-14 17:31:57,738 - INFO - Processing document 4_2025-05-21
2025-11-14 17:31:57,757 - INFO - Finished converting document 4_2025-05-21 in 0.03 sec.
2025-11-14 17:31:57,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,824 - INFO - Going to convert document batch...
2025-11-14 17:31:57,825 - INFO - Processing document 4_2025-06-05
2025-11-14 17:31:57,862 - INFO - Finished converting document 4_2025-06-05 in 0.08 sec.
2025-11-14 17:31:57,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2025-05-08' --> 'data\processed_data\RTX\4_2025-05-08.md'
Converted 'data\edgar_documents\RTX\4_2025-05-21' --> 'data\processed_data\RTX\4_2025-05-21.md'
Converted 'data\edgar_documents\RTX\4_2025-06-05' --> 'data\processed_data\RTX\4_2025-06-05.md'


2025-11-14 17:31:57,919 - INFO - Going to convert document batch...
2025-11-14 17:31:57,919 - INFO - Processing document 4_2025-07-25
2025-11-14 17:31:57,941 - INFO - Finished converting document 4_2025-07-25 in 0.05 sec.
2025-11-14 17:31:57,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:57,988 - INFO - Going to convert document batch...
2025-11-14 17:31:57,988 - INFO - Processing document 4_2025-07-28
2025-11-14 17:31:58,012 - INFO - Finished converting document 4_2025-07-28 in 0.05 sec.
2025-11-14 17:31:58,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,059 - INFO - Going to convert document batch...
2025-11-14 17:31:58,060 - INFO - Processing document 4_2025-08-06
2025-11-14 17:31:58,085 - INFO - Finished converting document 4_2025-08-06 in 0.05 sec.
2025-11-14 17:31:58,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,134 - INFO - Going to convert document batch...
2025-11-14 17:31:58,135 - 

Converted 'data\edgar_documents\RTX\4_2025-07-25' --> 'data\processed_data\RTX\4_2025-07-25.md'
Converted 'data\edgar_documents\RTX\4_2025-07-28' --> 'data\processed_data\RTX\4_2025-07-28.md'
Converted 'data\edgar_documents\RTX\4_2025-08-06' --> 'data\processed_data\RTX\4_2025-08-06.md'


2025-11-14 17:31:58,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,216 - INFO - Going to convert document batch...
2025-11-14 17:31:58,217 - INFO - Processing document 4_2025-08-28
2025-11-14 17:31:58,246 - INFO - Finished converting document 4_2025-08-28 in 0.06 sec.
2025-11-14 17:31:58,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,307 - INFO - Going to convert document batch...
2025-11-14 17:31:58,309 - INFO - Processing document 4_2025-10-03
2025-11-14 17:31:58,350 - INFO - Finished converting document 4_2025-10-03 in 0.08 sec.


Converted 'data\edgar_documents\RTX\4_2025-08-13' --> 'data\processed_data\RTX\4_2025-08-13.md'
Converted 'data\edgar_documents\RTX\4_2025-08-28' --> 'data\processed_data\RTX\4_2025-08-28.md'


2025-11-14 17:31:58,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,409 - INFO - Going to convert document batch...
2025-11-14 17:31:58,410 - INFO - Processing document 4_2025-10-28
2025-11-14 17:31:58,438 - INFO - Finished converting document 4_2025-10-28 in 0.06 sec.
2025-11-14 17:31:58,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,492 - INFO - Going to convert document batch...
2025-11-14 17:31:58,492 - INFO - Processing document 4_2025-10-29
2025-11-14 17:31:58,519 - INFO - Finished converting document 4_2025-10-29 in 0.05 sec.
2025-11-14 17:31:58,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\4_2025-10-03' --> 'data\processed_data\RTX\4_2025-10-03.md'
Converted 'data\edgar_documents\RTX\4_2025-10-28' --> 'data\processed_data\RTX\4_2025-10-28.md'
Converted 'data\edgar_documents\RTX\4_2025-10-29' --> 'data\processed_data\RTX\4_2025-10-29.md'


2025-11-14 17:31:58,591 - INFO - Going to convert document batch...
2025-11-14 17:31:58,592 - INFO - Processing document 8-K_2023-01-17
2025-11-14 17:31:58,625 - INFO - Finished converting document 8-K_2023-01-17 in 0.08 sec.
2025-11-14 17:31:58,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,692 - INFO - Going to convert document batch...
2025-11-14 17:31:58,693 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:31:58,715 - INFO - Finished converting document 8-K_2023-01-24 in 0.06 sec.
2025-11-14 17:31:58,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,758 - INFO - Going to convert document batch...
2025-11-14 17:31:58,759 - INFO - Processing document 8-K_2023-02-21
2025-11-14 17:31:58,785 - INFO - Finished converting document 8-K_2023-02-21 in 0.06 sec.
2025-11-14 17:31:58,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,829 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\RTX\8-K_2023-01-17' --> 'data\processed_data\RTX\8-K_2023-01-17.md'
Converted 'data\edgar_documents\RTX\8-K_2023-01-24' --> 'data\processed_data\RTX\8-K_2023-01-24.md'
Converted 'data\edgar_documents\RTX\8-K_2023-02-21' --> 'data\processed_data\RTX\8-K_2023-02-21.md'


2025-11-14 17:31:58,853 - INFO - Finished converting document 8-K_2023-02-27 in 0.05 sec.
2025-11-14 17:31:58,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,896 - INFO - Going to convert document batch...
2025-11-14 17:31:58,897 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:31:58,917 - INFO - Finished converting document 8-K_2023-04-25 in 0.06 sec.
2025-11-14 17:31:58,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:58,975 - INFO - Going to convert document batch...
2025-11-14 17:31:58,976 - INFO - Processing document 8-K_2023-05-04
2025-11-14 17:31:59,026 - INFO - Finished converting document 8-K_2023-05-04 in 0.11 sec.


Converted 'data\edgar_documents\RTX\8-K_2023-02-27' --> 'data\processed_data\RTX\8-K_2023-02-27.md'
Converted 'data\edgar_documents\RTX\8-K_2023-04-25' --> 'data\processed_data\RTX\8-K_2023-04-25.md'


2025-11-14 17:31:59,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,075 - INFO - Going to convert document batch...
2025-11-14 17:31:59,076 - INFO - Processing document 8-K_2023-06-20
2025-11-14 17:31:59,101 - INFO - Finished converting document 8-K_2023-06-20 in 0.05 sec.
2025-11-14 17:31:59,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,147 - INFO - Going to convert document batch...
2025-11-14 17:31:59,149 - INFO - Processing document 8-K_2023-07-17
2025-11-14 17:31:59,183 - INFO - Finished converting document 8-K_2023-07-17 in 0.08 sec.
2025-11-14 17:31:59,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,244 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\RTX\8-K_2023-05-04' --> 'data\processed_data\RTX\8-K_2023-05-04.md'
Converted 'data\edgar_documents\RTX\8-K_2023-06-20' --> 'data\processed_data\RTX\8-K_2023-06-20.md'
Converted 'data\edgar_documents\RTX\8-K_2023-07-17' --> 'data\processed_data\RTX\8-K_2023-07-17.md'


2025-11-14 17:31:59,245 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:31:59,273 - INFO - Finished converting document 8-K_2023-07-25 in 0.06 sec.
2025-11-14 17:31:59,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,325 - INFO - Going to convert document batch...
2025-11-14 17:31:59,327 - INFO - Processing document 8-K_2023-09-11
2025-11-14 17:31:59,364 - INFO - Finished converting document 8-K_2023-09-11 in 0.06 sec.
2025-11-14 17:31:59,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,419 - INFO - Going to convert document batch...
2025-11-14 17:31:59,420 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:31:59,447 - INFO - Finished converting document 8-K_2023-10-24 in 0.06 sec.


Converted 'data\edgar_documents\RTX\8-K_2023-07-25' --> 'data\processed_data\RTX\8-K_2023-07-25.md'
Converted 'data\edgar_documents\RTX\8-K_2023-09-11' --> 'data\processed_data\RTX\8-K_2023-09-11.md'


2025-11-14 17:31:59,477 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:31:59,478 - ERROR - Input document 8-K_2023-10-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:31:59,480 - INFO - Going to convert document batch...
2025-11-14 17:31:59,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,514 - INFO - Going to convert document batch...
2025-11-14 17:31:59,515 - INFO - Processing document 8-K_2023-11

Converted 'data\edgar_documents\RTX\8-K_2023-10-24' --> 'data\processed_data\RTX\8-K_2023-10-24.md'
Error processing data\edgar_documents\RTX\8-K_2023-10-25: File format not allowed: data\edgar_documents\RTX\8-K_2023-10-25
Converted 'data\edgar_documents\RTX\8-K_2023-11-08' --> 'data\processed_data\RTX\8-K_2023-11-08.md'
Converted 'data\edgar_documents\RTX\8-K_2023-11-22' --> 'data\processed_data\RTX\8-K_2023-11-22.md'


2025-11-14 17:31:59,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,695 - INFO - Going to convert document batch...
2025-11-14 17:31:59,696 - INFO - Processing document 8-K_2023-12-14
2025-11-14 17:31:59,718 - INFO - Finished converting document 8-K_2023-12-14 in 0.08 sec.
2025-11-14 17:31:59,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,761 - INFO - Going to convert document batch...
2025-11-14 17:31:59,762 - INFO - Processing document 8-K_2024-01-04
2025-11-14 17:31:59,785 - INFO - Finished converting document 8-K_2024-01-04 in 0.05 sec.
2025-11-14 17:31:59,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,842 - INFO - Going to convert document batch...
2025-11-14 17:31:59,844 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:31:59,871 - INFO - Finished converting document 8-K_2024-01-23 in 0.08 sec.


Converted 'data\edgar_documents\RTX\8-K_2023-12-14' --> 'data\processed_data\RTX\8-K_2023-12-14.md'
Converted 'data\edgar_documents\RTX\8-K_2024-01-04' --> 'data\processed_data\RTX\8-K_2024-01-04.md'
Converted 'data\edgar_documents\RTX\8-K_2024-01-23' --> 'data\processed_data\RTX\8-K_2024-01-23.md'


2025-11-14 17:31:59,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:31:59,964 - INFO - Going to convert document batch...
2025-11-14 17:31:59,965 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:31:59,995 - INFO - Finished converting document 8-K_2024-04-23 in 0.09 sec.
2025-11-14 17:32:00,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,109 - INFO - Going to convert document batch...
2025-11-14 17:32:00,111 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:32:00,174 - INFO - Finished converting document 8-K_2024-05-06 in 0.16 sec.


Converted 'data\edgar_documents\RTX\8-K_2024-04-23' --> 'data\processed_data\RTX\8-K_2024-04-23.md'


2025-11-14 17:32:00,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,247 - INFO - Going to convert document batch...
2025-11-14 17:32:00,248 - INFO - Processing document 8-K_2024-07-17
2025-11-14 17:32:00,284 - INFO - Finished converting document 8-K_2024-07-17 in 0.08 sec.
2025-11-14 17:32:00,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,337 - INFO - Going to convert document batch...
2025-11-14 17:32:00,338 - INFO - Processing document 8-K_2024-07-25
2025-11-14 17:32:00,368 - INFO - Finished converting document 8-K_2024-07-25 in 0.06 sec.
2025-11-14 17:32:00,405 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\RTX\8-K_2024-05-06' --> 'data\processed_data\RTX\8-K_2024-05-06.md'
Converted 'data\edgar_documents\RTX\8-K_2024-07-17' --> 'data\processed_data\RTX\8-K_2024-07-17.md'
Converted 'data\edgar_documents\RTX\8-K_2024-07-25' --> 'data\processed_data\RTX\8-K_2024-07-25.md'


2025-11-14 17:32:00,405 - ERROR - Input document 8-K_2024-07-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:32:00,407 - INFO - Going to convert document batch...
2025-11-14 17:32:00,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,438 - INFO - Going to convert document batch...
2025-11-14 17:32:00,439 - INFO - Processing document 8-K_2024-08-30
2025-11-14 17:32:00,465 - INFO - Finished converting document 8-K_2024-08-30 in 0.06 sec.
2025-11-14 17:32:00,497 - INFO -

Error processing data\edgar_documents\RTX\8-K_2024-07-31: File format not allowed: data\edgar_documents\RTX\8-K_2024-07-31
Converted 'data\edgar_documents\RTX\8-K_2024-08-30' --> 'data\processed_data\RTX\8-K_2024-08-30.md'
Converted 'data\edgar_documents\RTX\8-K_2024-10-16' --> 'data\processed_data\RTX\8-K_2024-10-16.md'


2025-11-14 17:32:00,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,652 - INFO - Going to convert document batch...
2025-11-14 17:32:00,652 - INFO - Processing document 8-K_2025-01-28
2025-11-14 17:32:00,674 - INFO - Finished converting document 8-K_2025-01-28 in 0.05 sec.
2025-11-14 17:32:00,705 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:32:00,705 - ERROR - Input document 8-K_2025-02-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\RTX\8-K_2024-10-22' --> 'data\processed_data\RTX\8-K_2024-10-22.md'
Converted 'data\edgar_documents\RTX\8-K_2025-01-28' --> 'data\processed_data\RTX\8-K_2025-01-28.md'
Error processing data\edgar_documents\RTX\8-K_2025-02-03: File format not allowed: data\edgar_documents\RTX\8-K_2025-02-03
Converted 'data\edgar_documents\RTX\8-K_2025-04-22' --> 'data\processed_data\RTX\8-K_2025-04-22.md'


2025-11-14 17:32:00,829 - INFO - Going to convert document batch...
2025-11-14 17:32:00,830 - INFO - Processing document 8-K_2025-05-05
2025-11-14 17:32:00,863 - INFO - Finished converting document 8-K_2025-05-05 in 0.08 sec.
2025-11-14 17:32:00,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,910 - INFO - Going to convert document batch...
2025-11-14 17:32:00,911 - INFO - Processing document 8-K_2025-07-22
2025-11-14 17:32:00,934 - INFO - Finished converting document 8-K_2025-07-22 in 0.06 sec.
2025-11-14 17:32:00,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:00,973 - INFO - Going to convert document batch...
2025-11-14 17:32:00,974 - INFO - Processing document 8-K_2025-09-24
2025-11-14 17:32:01,002 - INFO - Finished converting document 8-K_2025-09-24 in 0.05 sec.
2025-11-14 17:32:01,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:32:01,054 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\RTX\8-K_2025-05-05' --> 'data\processed_data\RTX\8-K_2025-05-05.md'
Converted 'data\edgar_documents\RTX\8-K_2025-07-22' --> 'data\processed_data\RTX\8-K_2025-07-22.md'
Converted 'data\edgar_documents\RTX\8-K_2025-09-24' --> 'data\processed_data\RTX\8-K_2025-09-24.md'


2025-11-14 17:32:01,140 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:32:01,141 - ERROR - Input document DEF-14A_2023-03-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:32:01,145 - INFO - Going to convert document batch...
2025-11-14 17:32:01,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\8-K_2025-10-21' --> 'data\processed_data\RTX\8-K_2025-10-21.md'
Error processing data\edgar_documents\RTX\DEF-14A_2023-03-13: File format not allowed: data\edgar_documents\RTX\DEF-14A_2023-03-13


2025-11-14 17:32:02,127 - INFO - Going to convert document batch...
2025-11-14 17:32:02,129 - INFO - Processing document DEF-14A_2024-03-11
2025-11-14 17:32:13,204 - INFO - Finished converting document DEF-14A_2024-03-11 in 12.06 sec.
2025-11-14 17:32:14,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\DEF-14A_2024-03-11' --> 'data\processed_data\RTX\DEF-14A_2024-03-11.md'


2025-11-14 17:32:15,502 - INFO - Going to convert document batch...
2025-11-14 17:32:15,503 - INFO - Processing document DEF-14A_2025-03-10
2025-11-14 17:32:36,873 - INFO - Finished converting document DEF-14A_2025-03-10 in 22.56 sec.
2025-11-14 17:32:38,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\RTX\DEF-14A_2025-03-10' --> 'data\processed_data\RTX\DEF-14A_2025-03-10.md'
Processed 91 new files. Errors: 8
Found 113 files to process in data\edgar_documents\SBUX


2025-11-14 17:32:39,253 - INFO - Going to convert document batch...
2025-11-14 17:32:39,254 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:32:39,254 - INFO - Processing document 10-K_2023-11-17
2025-11-14 17:32:40,931 - INFO - Finished converting document 10-K_2023-11-17 in 2.83 sec.
2025-11-14 17:32:41,596 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:32:41,597 - ERROR - Input document 10-K_2024-11-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: '

Converted 'data\edgar_documents\SBUX\10-K_2023-11-17' --> 'data\processed_data\SBUX\10-K_2023-11-17.md'
Error processing data\edgar_documents\SBUX\10-K_2024-11-20: File format not allowed: data\edgar_documents\SBUX\10-K_2024-11-20


2025-11-14 17:32:42,318 - INFO - Going to convert document batch...
2025-11-14 17:32:42,319 - INFO - Processing document 10-Q_2023-02-02
2025-11-14 17:32:43,159 - INFO - Finished converting document 10-Q_2023-02-02 in 1.56 sec.
2025-11-14 17:32:43,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2023-02-02' --> 'data\processed_data\SBUX\10-Q_2023-02-02.md'


2025-11-14 17:32:44,148 - INFO - Going to convert document batch...
2025-11-14 17:32:44,149 - INFO - Processing document 10-Q_2023-05-02
2025-11-14 17:32:45,584 - INFO - Finished converting document 10-Q_2023-05-02 in 2.00 sec.
2025-11-14 17:32:46,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2023-05-02' --> 'data\processed_data\SBUX\10-Q_2023-05-02.md'


2025-11-14 17:32:46,660 - INFO - Going to convert document batch...
2025-11-14 17:32:46,662 - INFO - Processing document 10-Q_2023-08-01
2025-11-14 17:32:47,700 - INFO - Finished converting document 10-Q_2023-08-01 in 1.61 sec.
2025-11-14 17:32:48,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2023-08-01' --> 'data\processed_data\SBUX\10-Q_2023-08-01.md'


2025-11-14 17:32:49,064 - INFO - Going to convert document batch...
2025-11-14 17:32:49,065 - INFO - Processing document 10-Q_2024-01-30
2025-11-14 17:32:49,937 - INFO - Finished converting document 10-Q_2024-01-30 in 1.31 sec.
2025-11-14 17:32:50,384 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:32:50,385 - ERROR - Input document 10-Q_2024-02-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:32:50,386 - INFO - Going to convert d

Converted 'data\edgar_documents\SBUX\10-Q_2024-01-30' --> 'data\processed_data\SBUX\10-Q_2024-01-30.md'
Error processing data\edgar_documents\SBUX\10-Q_2024-02-16: File format not allowed: data\edgar_documents\SBUX\10-Q_2024-02-16


2025-11-14 17:32:51,282 - INFO - Going to convert document batch...
2025-11-14 17:32:51,284 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 17:32:52,308 - INFO - Finished converting document 10-Q_2024-04-30 in 1.92 sec.
2025-11-14 17:32:52,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2024-04-30' --> 'data\processed_data\SBUX\10-Q_2024-04-30.md'


2025-11-14 17:32:53,746 - INFO - Going to convert document batch...
2025-11-14 17:32:53,747 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 17:32:54,754 - INFO - Finished converting document 10-Q_2024-07-30 in 1.88 sec.
2025-11-14 17:32:55,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2024-07-30' --> 'data\processed_data\SBUX\10-Q_2024-07-30.md'


2025-11-14 17:32:55,773 - INFO - Going to convert document batch...
2025-11-14 17:32:55,773 - INFO - Processing document 10-Q_2025-01-28
2025-11-14 17:32:56,559 - INFO - Finished converting document 10-Q_2025-01-28 in 1.27 sec.
2025-11-14 17:32:57,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2025-01-28' --> 'data\processed_data\SBUX\10-Q_2025-01-28.md'


2025-11-14 17:32:57,948 - INFO - Going to convert document batch...
2025-11-14 17:32:57,949 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:32:58,935 - INFO - Finished converting document 10-Q_2025-04-29 in 1.95 sec.
2025-11-14 17:32:59,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\10-Q_2025-04-29' --> 'data\processed_data\SBUX\10-Q_2025-04-29.md'


2025-11-14 17:33:00,375 - INFO - Going to convert document batch...
2025-11-14 17:33:00,375 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 17:33:01,409 - INFO - Finished converting document 10-Q_2025-07-29 in 1.97 sec.
2025-11-14 17:33:02,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,051 - INFO - Going to convert document batch...
2025-11-14 17:33:02,052 - INFO - Processing document 4_2023-01-11
2025-11-14 17:33:02,081 - INFO - Finished converting document 4_2023-01-11 in 0.08 sec.
2025-11-14 17:33:02,179 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:02,181 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\SBUX\10-Q_2025-07-29' --> 'data\processed_data\SBUX\10-Q_2025-07-29.md'
Converted 'data\edgar_documents\SBUX\4_2023-01-11' --> 'data\processed_data\SBUX\4_2023-01-11.md'


2025-11-14 17:33:02,219 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:02,219 - ERROR - Input document 4_2023-02-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:33:02,220 - INFO - Going to convert document batch...
2025-11-14 17:33:02,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,251 - INFO - Going to convert document batch...
2025-11-14 17:33:02,252 - INFO - Processing document 4_2023-02-15
2025-11-14 17:33:02,275 - INFO - Fin

Error processing data\edgar_documents\SBUX\4_2023-02-07: File format not allowed: data\edgar_documents\SBUX\4_2023-02-07
Error processing data\edgar_documents\SBUX\4_2023-02-09: File format not allowed: data\edgar_documents\SBUX\4_2023-02-09
Converted 'data\edgar_documents\SBUX\4_2023-02-15' --> 'data\processed_data\SBUX\4_2023-02-15.md'


2025-11-14 17:33:02,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,401 - INFO - Going to convert document batch...
2025-11-14 17:33:02,402 - INFO - Processing document 4_2023-02-21
2025-11-14 17:33:02,419 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 17:33:02,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,472 - INFO - Going to convert document batch...
2025-11-14 17:33:02,473 - INFO - Processing document 4_2023-02-23
2025-11-14 17:33:02,492 - INFO - Finished converting document 4_2023-02-23 in 0.05 sec.
2025-11-14 17:33:02,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,539 - INFO - Going to convert document batch...
2025-11-14 17:33:02,540 - INFO - Processing document 4_2023-03-29
2025-11-14 17:33:02,558 - INFO - Finished converting document 4_2023-03-29 in 0.05 sec.


Converted 'data\edgar_documents\SBUX\4_2023-02-17' --> 'data\processed_data\SBUX\4_2023-02-17.md'
Converted 'data\edgar_documents\SBUX\4_2023-02-21' --> 'data\processed_data\SBUX\4_2023-02-21.md'
Converted 'data\edgar_documents\SBUX\4_2023-02-23' --> 'data\processed_data\SBUX\4_2023-02-23.md'


2025-11-14 17:33:02,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,606 - INFO - Going to convert document batch...
2025-11-14 17:33:02,607 - INFO - Processing document 4_2023-05-17
2025-11-14 17:33:02,626 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 17:33:02,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,675 - INFO - Going to convert document batch...
2025-11-14 17:33:02,676 - INFO - Processing document 4_2023-06-20
2025-11-14 17:33:02,714 - INFO - Finished converting document 4_2023-06-20 in 0.08 sec.
2025-11-14 17:33:02,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,770 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SBUX\4_2023-03-29' --> 'data\processed_data\SBUX\4_2023-03-29.md'
Converted 'data\edgar_documents\SBUX\4_2023-05-17' --> 'data\processed_data\SBUX\4_2023-05-17.md'
Converted 'data\edgar_documents\SBUX\4_2023-06-20' --> 'data\processed_data\SBUX\4_2023-06-20.md'


2025-11-14 17:33:02,771 - INFO - Processing document 4_2023-06-23
2025-11-14 17:33:02,798 - INFO - Finished converting document 4_2023-06-23 in 0.06 sec.
2025-11-14 17:33:02,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,846 - INFO - Going to convert document batch...
2025-11-14 17:33:02,847 - INFO - Processing document 4_2023-08-17
2025-11-14 17:33:02,868 - INFO - Finished converting document 4_2023-08-17 in 0.03 sec.
2025-11-14 17:33:02,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,909 - INFO - Going to convert document batch...
2025-11-14 17:33:02,909 - INFO - Processing document 4_2023-09-19
2025-11-14 17:33:02,930 - INFO - Finished converting document 4_2023-09-19 in 0.03 sec.
2025-11-14 17:33:02,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:02,967 - INFO - Going to convert document batch...
2025-11-14 17:33:02,968 - INFO - Processing document 4_2023-10-03
2025-11-14 17:33:02,987 - IN

Converted 'data\edgar_documents\SBUX\4_2023-06-23' --> 'data\processed_data\SBUX\4_2023-06-23.md'
Converted 'data\edgar_documents\SBUX\4_2023-08-17' --> 'data\processed_data\SBUX\4_2023-08-17.md'
Converted 'data\edgar_documents\SBUX\4_2023-09-19' --> 'data\processed_data\SBUX\4_2023-09-19.md'
Converted 'data\edgar_documents\SBUX\4_2023-10-03' --> 'data\processed_data\SBUX\4_2023-10-03.md'


2025-11-14 17:33:03,045 - INFO - Going to convert document batch...
2025-11-14 17:33:03,046 - INFO - Processing document 4_2023-10-04
2025-11-14 17:33:03,067 - INFO - Finished converting document 4_2023-10-04 in 0.06 sec.
2025-11-14 17:33:03,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,107 - INFO - Going to convert document batch...
2025-11-14 17:33:03,108 - INFO - Processing document 4_2023-11-09
2025-11-14 17:33:03,129 - INFO - Finished converting document 4_2023-11-09 in 0.05 sec.
2025-11-14 17:33:03,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,185 - INFO - Going to convert document batch...
2025-11-14 17:33:03,186 - INFO - Processing document 4_2023-11-14
2025-11-14 17:33:03,203 - INFO - Finished converting document 4_2023-11-14 in 0.06 sec.
2025-11-14 17:33:03,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,242 - INFO - Going to convert document batch...
2025-11-14 17:33:03,242 - 

Converted 'data\edgar_documents\SBUX\4_2023-10-04' --> 'data\processed_data\SBUX\4_2023-10-04.md'
Converted 'data\edgar_documents\SBUX\4_2023-11-09' --> 'data\processed_data\SBUX\4_2023-11-09.md'
Converted 'data\edgar_documents\SBUX\4_2023-11-14' --> 'data\processed_data\SBUX\4_2023-11-14.md'


2025-11-14 17:33:03,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,297 - INFO - Going to convert document batch...
2025-11-14 17:33:03,298 - INFO - Processing document 4_2023-11-16
2025-11-14 17:33:03,318 - INFO - Finished converting document 4_2023-11-16 in 0.03 sec.
2025-11-14 17:33:03,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,378 - INFO - Going to convert document batch...
2025-11-14 17:33:03,379 - INFO - Processing document 4_2023-11-17
2025-11-14 17:33:03,397 - INFO - Finished converting document 4_2023-11-17 in 0.05 sec.
2025-11-14 17:33:03,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,436 - INFO - Going to convert document batch...
2025-11-14 17:33:03,437 - INFO - Processing document 4_2023-11-20
2025-11-14 17:33:03,456 - INFO - Finished converting document 4_2023-11-20 in 0.03 sec.


Converted 'data\edgar_documents\SBUX\4_2023-11-15' --> 'data\processed_data\SBUX\4_2023-11-15.md'
Converted 'data\edgar_documents\SBUX\4_2023-11-16' --> 'data\processed_data\SBUX\4_2023-11-16.md'
Converted 'data\edgar_documents\SBUX\4_2023-11-17' --> 'data\processed_data\SBUX\4_2023-11-17.md'


2025-11-14 17:33:03,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,497 - INFO - Going to convert document batch...
2025-11-14 17:33:03,497 - INFO - Processing document 4_2023-11-22
2025-11-14 17:33:03,520 - INFO - Finished converting document 4_2023-11-22 in 0.05 sec.
2025-11-14 17:33:03,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,560 - INFO - Going to convert document batch...
2025-11-14 17:33:03,561 - INFO - Processing document 4_2023-12-22
2025-11-14 17:33:03,579 - INFO - Finished converting document 4_2023-12-22 in 0.05 sec.
2025-11-14 17:33:03,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,625 - INFO - Going to convert document batch...
2025-11-14 17:33:03,625 - INFO - Processing document 4_2024-01-18
2025-11-14 17:33:03,644 - INFO - Finished converting document 4_2024-01-18 in 0.05 sec.


Converted 'data\edgar_documents\SBUX\4_2023-11-20' --> 'data\processed_data\SBUX\4_2023-11-20.md'
Converted 'data\edgar_documents\SBUX\4_2023-11-22' --> 'data\processed_data\SBUX\4_2023-11-22.md'
Converted 'data\edgar_documents\SBUX\4_2023-12-22' --> 'data\processed_data\SBUX\4_2023-12-22.md'
Converted 'data\edgar_documents\SBUX\4_2024-01-18' --> 'data\processed_data\SBUX\4_2024-01-18.md'


2025-11-14 17:33:03,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,702 - INFO - Going to convert document batch...
2025-11-14 17:33:03,702 - INFO - Processing document 4_2024-01-23
2025-11-14 17:33:03,720 - INFO - Finished converting document 4_2024-01-23 in 0.06 sec.
2025-11-14 17:33:03,763 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:03,764 - ERROR - Input document 4_2024-02-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:33

Converted 'data\edgar_documents\SBUX\4_2024-01-23' --> 'data\processed_data\SBUX\4_2024-01-23.md'
Error processing data\edgar_documents\SBUX\4_2024-02-05: File format not allowed: data\edgar_documents\SBUX\4_2024-02-05
Error processing data\edgar_documents\SBUX\4_2024-02-06: File format not allowed: data\edgar_documents\SBUX\4_2024-02-06
Converted 'data\edgar_documents\SBUX\4_2024-02-16' --> 'data\processed_data\SBUX\4_2024-02-16.md'
Converted 'data\edgar_documents\SBUX\4_2024-02-22' --> 'data\processed_data\SBUX\4_2024-02-22.md'


2025-11-14 17:33:03,920 - INFO - Processing document 4_2024-03-06
2025-11-14 17:33:03,940 - INFO - Finished converting document 4_2024-03-06 in 0.05 sec.
2025-11-14 17:33:03,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:03,983 - INFO - Going to convert document batch...
2025-11-14 17:33:03,983 - INFO - Processing document 4_2024-03-15
2025-11-14 17:33:04,002 - INFO - Finished converting document 4_2024-03-15 in 0.05 sec.
2025-11-14 17:33:04,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,043 - INFO - Going to convert document batch...
2025-11-14 17:33:04,044 - INFO - Processing document 4_2024-03-25
2025-11-14 17:33:04,062 - INFO - Finished converting document 4_2024-03-25 in 0.05 sec.
2025-11-14 17:33:04,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,101 - INFO - Going to convert document batch...
2025-11-14 17:33:04,102 - INFO - Processing document 4_2024-04-17
2025-11-14 17:33:04,120 - IN

Converted 'data\edgar_documents\SBUX\4_2024-03-06' --> 'data\processed_data\SBUX\4_2024-03-06.md'
Converted 'data\edgar_documents\SBUX\4_2024-03-15' --> 'data\processed_data\SBUX\4_2024-03-15.md'
Converted 'data\edgar_documents\SBUX\4_2024-03-25' --> 'data\processed_data\SBUX\4_2024-03-25.md'


2025-11-14 17:33:04,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,162 - INFO - Going to convert document batch...
2025-11-14 17:33:04,162 - INFO - Processing document 4_2024-04-24
2025-11-14 17:33:04,182 - INFO - Finished converting document 4_2024-04-24 in 0.03 sec.
2025-11-14 17:33:04,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,233 - INFO - Going to convert document batch...
2025-11-14 17:33:04,234 - INFO - Processing document 4_2024-05-17
2025-11-14 17:33:04,254 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 17:33:04,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,292 - INFO - Going to convert document batch...
2025-11-14 17:33:04,293 - INFO - Processing document 4_2024-05-23
2025-11-14 17:33:04,310 - INFO - Finished converting document 4_2024-05-23 in 0.05 sec.


Converted 'data\edgar_documents\SBUX\4_2024-04-17' --> 'data\processed_data\SBUX\4_2024-04-17.md'
Converted 'data\edgar_documents\SBUX\4_2024-04-24' --> 'data\processed_data\SBUX\4_2024-04-24.md'
Converted 'data\edgar_documents\SBUX\4_2024-05-17' --> 'data\processed_data\SBUX\4_2024-05-17.md'


2025-11-14 17:33:04,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,347 - INFO - Going to convert document batch...
2025-11-14 17:33:04,348 - INFO - Processing document 4_2024-05-24
2025-11-14 17:33:04,369 - INFO - Finished converting document 4_2024-05-24 in 0.03 sec.
2025-11-14 17:33:04,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\4_2024-05-23' --> 'data\processed_data\SBUX\4_2024-05-23.md'
Converted 'data\edgar_documents\SBUX\4_2024-05-24' --> 'data\processed_data\SBUX\4_2024-05-24.md'


2025-11-14 17:33:04,805 - INFO - Going to convert document batch...
2025-11-14 17:33:04,807 - INFO - Processing document 4_2024-06-18
2025-11-14 17:33:04,826 - INFO - Finished converting document 4_2024-06-18 in 0.42 sec.
2025-11-14 17:33:04,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,869 - INFO - Going to convert document batch...
2025-11-14 17:33:04,869 - INFO - Processing document 4_2024-06-20
2025-11-14 17:33:04,890 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 17:33:04,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,931 - INFO - Going to convert document batch...
2025-11-14 17:33:04,932 - INFO - Processing document 4_2024-08-15
2025-11-14 17:33:04,950 - INFO - Finished converting document 4_2024-08-15 in 0.05 sec.
2025-11-14 17:33:04,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:04,990 - INFO - Going to convert document batch...
2025-11-14 17:33:04,990 - 

Converted 'data\edgar_documents\SBUX\4_2024-06-18' --> 'data\processed_data\SBUX\4_2024-06-18.md'
Converted 'data\edgar_documents\SBUX\4_2024-06-20' --> 'data\processed_data\SBUX\4_2024-06-20.md'
Converted 'data\edgar_documents\SBUX\4_2024-08-15' --> 'data\processed_data\SBUX\4_2024-08-15.md'


2025-11-14 17:33:05,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,049 - INFO - Going to convert document batch...
2025-11-14 17:33:05,049 - INFO - Processing document 4_2024-09-17
2025-11-14 17:33:05,066 - INFO - Finished converting document 4_2024-09-17 in 0.03 sec.
2025-11-14 17:33:05,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,126 - INFO - Going to convert document batch...
2025-11-14 17:33:05,127 - INFO - Processing document 4_2024-11-13
2025-11-14 17:33:05,148 - INFO - Finished converting document 4_2024-11-13 in 0.05 sec.
2025-11-14 17:33:05,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,186 - INFO - Going to convert document batch...
2025-11-14 17:33:05,187 - INFO - Processing document 4_2024-11-18
2025-11-14 17:33:05,206 - INFO - Finished converting document 4_2024-11-18 in 0.03 sec.


Converted 'data\edgar_documents\SBUX\4_2024-08-19' --> 'data\processed_data\SBUX\4_2024-08-19.md'
Converted 'data\edgar_documents\SBUX\4_2024-09-17' --> 'data\processed_data\SBUX\4_2024-09-17.md'
Converted 'data\edgar_documents\SBUX\4_2024-11-13' --> 'data\processed_data\SBUX\4_2024-11-13.md'


2025-11-14 17:33:05,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,248 - INFO - Going to convert document batch...
2025-11-14 17:33:05,249 - INFO - Processing document 4_2024-11-20
2025-11-14 17:33:05,271 - INFO - Finished converting document 4_2024-11-20 in 0.05 sec.
2025-11-14 17:33:05,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,314 - INFO - Going to convert document batch...
2025-11-14 17:33:05,315 - INFO - Processing document 4_2024-11-22
2025-11-14 17:33:05,332 - INFO - Finished converting document 4_2024-11-22 in 0.03 sec.
2025-11-14 17:33:05,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,386 - INFO - Going to convert document batch...
2025-11-14 17:33:05,386 - INFO - Processing document 4_2024-12-03
2025-11-14 17:33:05,411 - INFO - Finished converting document 4_2024-12-03 in 0.06 sec.


Converted 'data\edgar_documents\SBUX\4_2024-11-18' --> 'data\processed_data\SBUX\4_2024-11-18.md'
Converted 'data\edgar_documents\SBUX\4_2024-11-20' --> 'data\processed_data\SBUX\4_2024-11-20.md'
Converted 'data\edgar_documents\SBUX\4_2024-11-22' --> 'data\processed_data\SBUX\4_2024-11-22.md'


2025-11-14 17:33:05,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,455 - INFO - Going to convert document batch...
2025-11-14 17:33:05,456 - INFO - Processing document 4_2025-02-19
2025-11-14 17:33:05,475 - INFO - Finished converting document 4_2025-02-19 in 0.03 sec.
2025-11-14 17:33:05,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,523 - INFO - Going to convert document batch...
2025-11-14 17:33:05,524 - INFO - Processing document 4_2025-03-14
2025-11-14 17:33:05,543 - INFO - Finished converting document 4_2025-03-14 in 0.05 sec.
2025-11-14 17:33:05,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,611 - INFO - Going to convert document batch...
2025-11-14 17:33:05,612 - INFO - Processing document 4_2025-03-18
2025-11-14 17:33:05,631 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.


Converted 'data\edgar_documents\SBUX\4_2024-12-03' --> 'data\processed_data\SBUX\4_2024-12-03.md'
Converted 'data\edgar_documents\SBUX\4_2025-02-19' --> 'data\processed_data\SBUX\4_2025-02-19.md'
Converted 'data\edgar_documents\SBUX\4_2025-03-14' --> 'data\processed_data\SBUX\4_2025-03-14.md'


2025-11-14 17:33:05,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:05,670 - INFO - Going to convert document batch...
2025-11-14 17:33:05,671 - INFO - Processing document 4_2025-03-26
2025-11-14 17:33:05,691 - INFO - Finished converting document 4_2025-03-26 in 0.05 sec.


Converted 'data\edgar_documents\SBUX\4_2025-03-18' --> 'data\processed_data\SBUX\4_2025-03-18.md'
Converted 'data\edgar_documents\SBUX\4_2025-03-26' --> 'data\processed_data\SBUX\4_2025-03-26.md'


2025-11-14 17:33:05,875 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:05,876 - ERROR - Input document 4_2025-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:33:05,877 - INFO - Going to convert document batch...
2025-11-14 17:33:05,906 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:05,907 - ERROR - Input document 4_2025-05-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\SBUX\4_2025-05-06: File format not allowed: data\edgar_documents\SBUX\4_2025-05-06
Error processing data\edgar_documents\SBUX\4_2025-05-07: File format not allowed: data\edgar_documents\SBUX\4_2025-05-07
Converted 'data\edgar_documents\SBUX\4_2025-05-16' --> 'data\processed_data\SBUX\4_2025-05-16.md'
Converted 'data\edgar_documents\SBUX\4_2025-06-18' --> 'data\processed_data\SBUX\4_2025-06-18.md'


2025-11-14 17:33:06,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,103 - INFO - Going to convert document batch...
2025-11-14 17:33:06,105 - INFO - Processing document 4_2025-09-11
2025-11-14 17:33:06,124 - INFO - Finished converting document 4_2025-09-11 in 0.05 sec.
2025-11-14 17:33:06,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,165 - INFO - Going to convert document batch...
2025-11-14 17:33:06,166 - INFO - Processing document 4_2025-09-17
2025-11-14 17:33:06,186 - INFO - Finished converting document 4_2025-09-17 in 0.05 sec.
2025-11-14 17:33:06,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,254 - INFO - Going to convert document batch...
2025-11-14 17:33:06,255 - INFO - Processing document 8-K_2023-02-02
2025-11-14 17:33:06,273 - INFO - Finished converting document 8-K_2023-02-02 in 0.06 sec.


Converted 'data\edgar_documents\SBUX\4_2025-07-03' --> 'data\processed_data\SBUX\4_2025-07-03.md'
Converted 'data\edgar_documents\SBUX\4_2025-09-11' --> 'data\processed_data\SBUX\4_2025-09-11.md'
Converted 'data\edgar_documents\SBUX\4_2025-09-17' --> 'data\processed_data\SBUX\4_2025-09-17.md'


2025-11-14 17:33:06,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,308 - INFO - Going to convert document batch...
2025-11-14 17:33:06,309 - INFO - Processing document 8-K_2023-02-16
2025-11-14 17:33:06,331 - INFO - Finished converting document 8-K_2023-02-16 in 0.05 sec.
2025-11-14 17:33:06,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,374 - INFO - Going to convert document batch...
2025-11-14 17:33:06,375 - INFO - Processing document 8-K_2023-03-21
2025-11-14 17:33:06,394 - INFO - Finished converting document 8-K_2023-03-21 in 0.05 sec.
2025-11-14 17:33:06,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,429 - INFO - Going to convert document batch...
2025-11-14 17:33:06,430 - INFO - Processing document 8-K_2023-03-28
2025-11-14 17:33:06,449 - INFO - Finished converting document 8-K_2023-03-28 in 0.05 sec.
2025-11-14 17:33:06,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\8-K_2023-02-02' --> 'data\processed_data\SBUX\8-K_2023-02-02.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-02-16' --> 'data\processed_data\SBUX\8-K_2023-02-16.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-03-21' --> 'data\processed_data\SBUX\8-K_2023-03-21.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-03-28' --> 'data\processed_data\SBUX\8-K_2023-03-28.md'


2025-11-14 17:33:06,496 - INFO - Going to convert document batch...
2025-11-14 17:33:06,497 - INFO - Processing document 8-K_2023-03-29
2025-11-14 17:33:06,544 - INFO - Finished converting document 8-K_2023-03-29 in 0.09 sec.
2025-11-14 17:33:06,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,586 - INFO - Going to convert document batch...
2025-11-14 17:33:06,588 - INFO - Processing document 8-K_2023-04-21
2025-11-14 17:33:06,614 - INFO - Finished converting document 8-K_2023-04-21 in 0.05 sec.
2025-11-14 17:33:06,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,679 - INFO - Going to convert document batch...
2025-11-14 17:33:06,679 - INFO - Processing document 8-K_2023-05-02
2025-11-14 17:33:06,700 - INFO - Finished converting document 8-K_2023-05-02 in 0.06 sec.
2025-11-14 17:33:06,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,734 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SBUX\8-K_2023-03-29' --> 'data\processed_data\SBUX\8-K_2023-03-29.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-04-21' --> 'data\processed_data\SBUX\8-K_2023-04-21.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-05-02' --> 'data\processed_data\SBUX\8-K_2023-05-02.md'


2025-11-14 17:33:06,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,791 - INFO - Going to convert document batch...
2025-11-14 17:33:06,792 - INFO - Processing document 8-K_2023-09-13
2025-11-14 17:33:06,815 - INFO - Finished converting document 8-K_2023-09-13 in 0.05 sec.
2025-11-14 17:33:06,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,853 - INFO - Going to convert document batch...
2025-11-14 17:33:06,854 - INFO - Processing document 8-K_2023-11-02
2025-11-14 17:33:06,876 - INFO - Finished converting document 8-K_2023-11-02 in 0.05 sec.
2025-11-14 17:33:06,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:06,914 - INFO - Going to convert document batch...
2025-11-14 17:33:06,915 - INFO - Processing document 8-K_2023-11-20
2025-11-14 17:33:06,934 - INFO - Finished converting document 8-K_2023-11-20 in 0.05 sec.
2025-11-14 17:33:06,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\8-K_2023-08-01' --> 'data\processed_data\SBUX\8-K_2023-08-01.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-09-13' --> 'data\processed_data\SBUX\8-K_2023-09-13.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-11-02' --> 'data\processed_data\SBUX\8-K_2023-11-02.md'
Converted 'data\edgar_documents\SBUX\8-K_2023-11-20' --> 'data\processed_data\SBUX\8-K_2023-11-20.md'


2025-11-14 17:33:06,970 - INFO - Going to convert document batch...
2025-11-14 17:33:06,971 - INFO - Processing document 8-K_2024-01-09
2025-11-14 17:33:06,991 - INFO - Finished converting document 8-K_2024-01-09 in 0.05 sec.
2025-11-14 17:33:07,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,024 - INFO - Going to convert document batch...
2025-11-14 17:33:07,025 - INFO - Processing document 8-K_2024-01-30
2025-11-14 17:33:07,046 - INFO - Finished converting document 8-K_2024-01-30 in 0.05 sec.
2025-11-14 17:33:07,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,080 - INFO - Going to convert document batch...
2025-11-14 17:33:07,080 - INFO - Processing document 8-K_2024-02-08
2025-11-14 17:33:07,104 - INFO - Finished converting document 8-K_2024-02-08 in 0.06 sec.
2025-11-14 17:33:07,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,153 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SBUX\8-K_2024-01-09' --> 'data\processed_data\SBUX\8-K_2024-01-09.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-01-30' --> 'data\processed_data\SBUX\8-K_2024-01-30.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-02-08' --> 'data\processed_data\SBUX\8-K_2024-02-08.md'


2025-11-14 17:33:07,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,222 - INFO - Going to convert document batch...
2025-11-14 17:33:07,223 - INFO - Processing document 8-K_2024-04-30
2025-11-14 17:33:07,242 - INFO - Finished converting document 8-K_2024-04-30 in 0.03 sec.
2025-11-14 17:33:07,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,290 - INFO - Going to convert document batch...
2025-11-14 17:33:07,292 - INFO - Processing document 8-K_2024-05-31
2025-11-14 17:33:07,312 - INFO - Finished converting document 8-K_2024-05-31 in 0.06 sec.
2025-11-14 17:33:07,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,347 - INFO - Going to convert document batch...
2025-11-14 17:33:07,347 - INFO - Processing document 8-K_2024-07-30
2025-11-14 17:33:07,365 - INFO - Finished converting document 8-K_2024-07-30 in 0.03 sec.


Converted 'data\edgar_documents\SBUX\8-K_2024-03-15' --> 'data\processed_data\SBUX\8-K_2024-03-15.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-04-30' --> 'data\processed_data\SBUX\8-K_2024-04-30.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-05-31' --> 'data\processed_data\SBUX\8-K_2024-05-31.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-07-30' --> 'data\processed_data\SBUX\8-K_2024-07-30.md'


2025-11-14 17:33:07,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,399 - INFO - Going to convert document batch...
2025-11-14 17:33:07,400 - INFO - Processing document 8-K_2024-08-14
2025-11-14 17:33:07,419 - INFO - Finished converting document 8-K_2024-08-14 in 0.05 sec.
2025-11-14 17:33:07,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,455 - INFO - Going to convert document batch...
2025-11-14 17:33:07,456 - INFO - Processing document 8-K_2024-09-16
2025-11-14 17:33:07,474 - INFO - Finished converting document 8-K_2024-09-16 in 0.03 sec.
2025-11-14 17:33:07,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,505 - INFO - Going to convert document batch...
2025-11-14 17:33:07,506 - INFO - Processing document 8-K_2024-10-22
2025-11-14 17:33:07,524 - INFO - Finished converting document 8-K_2024-10-22 in 0.03 sec.
2025-11-14 17:33:07,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SBUX\8-K_2024-08-14' --> 'data\processed_data\SBUX\8-K_2024-08-14.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-09-16' --> 'data\processed_data\SBUX\8-K_2024-09-16.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-10-22' --> 'data\processed_data\SBUX\8-K_2024-10-22.md'
Converted 'data\edgar_documents\SBUX\8-K_2024-10-30' --> 'data\processed_data\SBUX\8-K_2024-10-30.md'


2025-11-14 17:33:07,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,655 - INFO - Going to convert document batch...
2025-11-14 17:33:07,656 - INFO - Processing document 8-K_2025-01-16
2025-11-14 17:33:07,678 - INFO - Finished converting document 8-K_2025-01-16 in 0.05 sec.
2025-11-14 17:33:07,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,710 - INFO - Going to convert document batch...
2025-11-14 17:33:07,711 - INFO - Processing document 8-K_2025-01-17
2025-11-14 17:33:07,729 - INFO - Finished converting document 8-K_2025-01-17 in 0.05 sec.
2025-11-14 17:33:07,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,763 - INFO - Going to convert document batch...
2025-11-14 17:33:07,764 - INFO - Processing document 8-K_2025-01-28
2025-11-14 17:33:07,783 - INFO - Finished converting document 8-K_2025-01-28 in 0.05 sec.
2025-11-14 17:33:07,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SBUX\8-K_2024-11-21' --> 'data\processed_data\SBUX\8-K_2024-11-21.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-01-16' --> 'data\processed_data\SBUX\8-K_2025-01-16.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-01-17' --> 'data\processed_data\SBUX\8-K_2025-01-17.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-01-28' --> 'data\processed_data\SBUX\8-K_2025-01-28.md'


2025-11-14 17:33:07,818 - INFO - Going to convert document batch...
2025-11-14 17:33:07,818 - INFO - Processing document 8-K_2025-03-04
2025-11-14 17:33:07,842 - INFO - Finished converting document 8-K_2025-03-04 in 0.05 sec.
2025-11-14 17:33:07,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,882 - INFO - Going to convert document batch...
2025-11-14 17:33:07,884 - INFO - Processing document 8-K_2025-03-07
2025-11-14 17:33:07,912 - INFO - Finished converting document 8-K_2025-03-07 in 0.05 sec.
2025-11-14 17:33:07,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:07,966 - INFO - Going to convert document batch...
2025-11-14 17:33:07,967 - INFO - Processing document 8-K_2025-03-14
2025-11-14 17:33:08,001 - INFO - Finished converting document 8-K_2025-03-14 in 0.08 sec.
2025-11-14 17:33:08,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,038 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SBUX\8-K_2025-03-04' --> 'data\processed_data\SBUX\8-K_2025-03-04.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-03-07' --> 'data\processed_data\SBUX\8-K_2025-03-07.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-03-14' --> 'data\processed_data\SBUX\8-K_2025-03-14.md'


2025-11-14 17:33:08,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,090 - INFO - Going to convert document batch...
2025-11-14 17:33:08,092 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:33:08,113 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 17:33:08,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,151 - INFO - Going to convert document batch...
2025-11-14 17:33:08,152 - INFO - Processing document 8-K_2025-05-08
2025-11-14 17:33:08,184 - INFO - Finished converting document 8-K_2025-05-08 in 0.06 sec.
2025-11-14 17:33:08,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,244 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SBUX\8-K_2025-04-23' --> 'data\processed_data\SBUX\8-K_2025-04-23.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-04-29' --> 'data\processed_data\SBUX\8-K_2025-04-29.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-05-08' --> 'data\processed_data\SBUX\8-K_2025-05-08.md'


2025-11-14 17:33:08,246 - INFO - Processing document 8-K_2025-06-04
2025-11-14 17:33:08,270 - INFO - Finished converting document 8-K_2025-06-04 in 0.06 sec.
2025-11-14 17:33:08,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,307 - INFO - Going to convert document batch...
2025-11-14 17:33:08,308 - INFO - Processing document 8-K_2025-06-16
2025-11-14 17:33:08,334 - INFO - Finished converting document 8-K_2025-06-16 in 0.05 sec.
2025-11-14 17:33:08,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,377 - INFO - Going to convert document batch...
2025-11-14 17:33:08,378 - INFO - Processing document 8-K_2025-06-26
2025-11-14 17:33:08,397 - INFO - Finished converting document 8-K_2025-06-26 in 0.05 sec.
2025-11-14 17:33:08,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,429 - INFO - Going to convert document batch...
2025-11-14 17:33:08,429 - INFO - Processing document 8-K_2025-06-30
2025-11-14 17:

Converted 'data\edgar_documents\SBUX\8-K_2025-06-04' --> 'data\processed_data\SBUX\8-K_2025-06-04.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-06-16' --> 'data\processed_data\SBUX\8-K_2025-06-16.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-06-26' --> 'data\processed_data\SBUX\8-K_2025-06-26.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-06-30' --> 'data\processed_data\SBUX\8-K_2025-06-30.md'


2025-11-14 17:33:08,483 - INFO - Going to convert document batch...
2025-11-14 17:33:08,483 - INFO - Processing document 8-K_2025-07-02
2025-11-14 17:33:08,502 - INFO - Finished converting document 8-K_2025-07-02 in 0.05 sec.
2025-11-14 17:33:08,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,537 - INFO - Going to convert document batch...
2025-11-14 17:33:08,538 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:33:08,559 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 17:33:08,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,592 - INFO - Going to convert document batch...
2025-11-14 17:33:08,592 - INFO - Processing document 8-K_2025-09-25
2025-11-14 17:33:08,613 - INFO - Finished converting document 8-K_2025-09-25 in 0.05 sec.
2025-11-14 17:33:08,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:08,646 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SBUX\8-K_2025-07-02' --> 'data\processed_data\SBUX\8-K_2025-07-02.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-07-29' --> 'data\processed_data\SBUX\8-K_2025-07-29.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-09-25' --> 'data\processed_data\SBUX\8-K_2025-09-25.md'
Converted 'data\edgar_documents\SBUX\8-K_2025-10-29' --> 'data\processed_data\SBUX\8-K_2025-10-29.md'


2025-11-14 17:33:08,698 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:33:08,717 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 17:33:08,765 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:33:08,766 - ERROR - Input document DEF-14A_2023-01-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:33:08,768 - INFO - Going to convert document batch...
2025-11-14 17:33:08,875 - INFO - detected formats:

Converted 'data\edgar_documents\SBUX\8-K_2025-11-03' --> 'data\processed_data\SBUX\8-K_2025-11-03.md'
Error processing data\edgar_documents\SBUX\DEF-14A_2023-01-27: File format not allowed: data\edgar_documents\SBUX\DEF-14A_2023-01-27
Error processing data\edgar_documents\SBUX\DEF-14A_2025-01-24: File format not allowed: data\edgar_documents\SBUX\DEF-14A_2025-01-24
Processed 103 new files. Errors: 10
Found 204 files to process in data\edgar_documents\SCHW


2025-11-14 17:33:09,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:33:10,730 - INFO - Going to convert document batch...
2025-11-14 17:33:10,731 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:33:10,732 - INFO - Processing document 10-K_2023-02-24
2025-11-14 17:33:15,346 - INFO - Finished converting document 10-K_2023-02-24 in 6.44 sec.
2025-11-14 17:33:16,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-K_2023-02-24' --> 'data\processed_data\SCHW\10-K_2023-02-24.md'


2025-11-14 17:33:18,341 - INFO - Going to convert document batch...
2025-11-14 17:33:18,342 - INFO - Processing document 10-K_2024-02-23
2025-11-14 17:33:23,155 - INFO - Finished converting document 10-K_2024-02-23 in 6.83 sec.
2025-11-14 17:33:24,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-K_2024-02-23' --> 'data\processed_data\SCHW\10-K_2024-02-23.md'


2025-11-14 17:33:26,163 - INFO - Going to convert document batch...
2025-11-14 17:33:26,164 - INFO - Processing document 10-K_2025-02-26
2025-11-14 17:33:31,115 - INFO - Finished converting document 10-K_2025-02-26 in 6.95 sec.
2025-11-14 17:33:32,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-K_2025-02-26' --> 'data\processed_data\SCHW\10-K_2025-02-26.md'


2025-11-14 17:33:33,779 - INFO - Going to convert document batch...
2025-11-14 17:33:33,780 - INFO - Processing document 10-Q_2023-05-08
2025-11-14 17:33:35,683 - INFO - Finished converting document 10-Q_2023-05-08 in 3.52 sec.
2025-11-14 17:33:36,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2023-05-08' --> 'data\processed_data\SCHW\10-Q_2023-05-08.md'


2025-11-14 17:33:38,182 - INFO - Going to convert document batch...
2025-11-14 17:33:38,183 - INFO - Processing document 10-Q_2023-08-08
2025-11-14 17:33:40,527 - INFO - Finished converting document 10-Q_2023-08-08 in 4.14 sec.
2025-11-14 17:33:42,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2023-08-08' --> 'data\processed_data\SCHW\10-Q_2023-08-08.md'


2025-11-14 17:33:43,412 - INFO - Going to convert document batch...
2025-11-14 17:33:43,413 - INFO - Processing document 10-Q_2023-11-08
2025-11-14 17:33:45,885 - INFO - Finished converting document 10-Q_2023-11-08 in 3.98 sec.
2025-11-14 17:33:46,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2023-11-08' --> 'data\processed_data\SCHW\10-Q_2023-11-08.md'


2025-11-14 17:33:47,667 - INFO - Going to convert document batch...
2025-11-14 17:33:47,668 - INFO - Processing document 10-Q_2024-05-09
2025-11-14 17:33:50,275 - INFO - Finished converting document 10-Q_2024-05-09 in 3.55 sec.
2025-11-14 17:33:51,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2024-05-09' --> 'data\processed_data\SCHW\10-Q_2024-05-09.md'


2025-11-14 17:33:52,733 - INFO - Going to convert document batch...
2025-11-14 17:33:52,734 - INFO - Processing document 10-Q_2024-08-08
2025-11-14 17:33:55,126 - INFO - Finished converting document 10-Q_2024-08-08 in 4.14 sec.
2025-11-14 17:33:56,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2024-08-08' --> 'data\processed_data\SCHW\10-Q_2024-08-08.md'


2025-11-14 17:33:57,675 - INFO - Going to convert document batch...
2025-11-14 17:33:57,675 - INFO - Processing document 10-Q_2024-11-08
2025-11-14 17:34:00,095 - INFO - Finished converting document 10-Q_2024-11-08 in 4.17 sec.
2025-11-14 17:34:00,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2024-11-08' --> 'data\processed_data\SCHW\10-Q_2024-11-08.md'


2025-11-14 17:34:02,440 - INFO - Going to convert document batch...
2025-11-14 17:34:02,442 - INFO - Processing document 10-Q_2025-05-09
2025-11-14 17:34:04,313 - INFO - Finished converting document 10-Q_2025-05-09 in 3.42 sec.
2025-11-14 17:34:05,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2025-05-09' --> 'data\processed_data\SCHW\10-Q_2025-05-09.md'


2025-11-14 17:34:06,756 - INFO - Going to convert document batch...
2025-11-14 17:34:06,756 - INFO - Processing document 10-Q_2025-08-08
2025-11-14 17:34:09,057 - INFO - Finished converting document 10-Q_2025-08-08 in 4.06 sec.
2025-11-14 17:34:10,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2025-08-08' --> 'data\processed_data\SCHW\10-Q_2025-08-08.md'


2025-11-14 17:34:11,480 - INFO - Going to convert document batch...
2025-11-14 17:34:11,482 - INFO - Processing document 10-Q_2025-11-07
2025-11-14 17:34:13,804 - INFO - Finished converting document 10-Q_2025-11-07 in 3.97 sec.
2025-11-14 17:34:14,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:14,620 - INFO - Going to convert document batch...
2025-11-14 17:34:14,620 - INFO - Processing document 4_2023-01-05
2025-11-14 17:34:14,640 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 17:34:14,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:14,691 - INFO - Going to convert document batch...
2025-11-14 17:34:14,691 - INFO - Processing document 4_2023-01-20
2025-11-14 17:34:14,712 - INFO - Finished converting document 4_2023-01-20 in 0.03 sec.
2025-11-14 17:34:14,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\10-Q_2025-11-07' --> 'data\processed_data\SCHW\10-Q_2025-11-07.md'
Converted 'data\edgar_documents\SCHW\4_2023-01-05' --> 'data\processed_data\SCHW\4_2023-01-05.md'
Converted 'data\edgar_documents\SCHW\4_2023-01-20' --> 'data\processed_data\SCHW\4_2023-01-20.md'


2025-11-14 17:34:14,779 - INFO - Going to convert document batch...
2025-11-14 17:34:14,780 - INFO - Processing document 4_2023-02-02
2025-11-14 17:34:14,804 - INFO - Finished converting document 4_2023-02-02 in 0.06 sec.
2025-11-14 17:34:14,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:14,849 - INFO - Going to convert document batch...
2025-11-14 17:34:14,850 - INFO - Processing document 4_2023-02-07
2025-11-14 17:34:14,872 - INFO - Finished converting document 4_2023-02-07 in 0.05 sec.
2025-11-14 17:34:14,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:14,955 - INFO - Going to convert document batch...
2025-11-14 17:34:14,956 - INFO - Processing document 4_2023-02-08
2025-11-14 17:34:15,006 - INFO - Finished converting document 4_2023-02-08 in 0.11 sec.


Converted 'data\edgar_documents\SCHW\4_2023-02-02' --> 'data\processed_data\SCHW\4_2023-02-02.md'
Converted 'data\edgar_documents\SCHW\4_2023-02-07' --> 'data\processed_data\SCHW\4_2023-02-07.md'


2025-11-14 17:34:15,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:15,054 - INFO - Going to convert document batch...
2025-11-14 17:34:15,055 - INFO - Processing document 4_2023-02-09
2025-11-14 17:34:15,078 - INFO - Finished converting document 4_2023-02-09 in 0.05 sec.
2025-11-14 17:34:15,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:15,140 - INFO - Going to convert document batch...
2025-11-14 17:34:15,141 - INFO - Processing document 4_2023-02-15
2025-11-14 17:34:15,164 - INFO - Finished converting document 4_2023-02-15 in 0.06 sec.
2025-11-14 17:34:15,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2023-02-08' --> 'data\processed_data\SCHW\4_2023-02-08.md'
Converted 'data\edgar_documents\SCHW\4_2023-02-09' --> 'data\processed_data\SCHW\4_2023-02-09.md'
Converted 'data\edgar_documents\SCHW\4_2023-02-15' --> 'data\processed_data\SCHW\4_2023-02-15.md'


2025-11-14 17:34:15,229 - INFO - Going to convert document batch...
2025-11-14 17:34:15,231 - INFO - Processing document 4_2023-02-16
2025-11-14 17:34:15,806 - INFO - Finished converting document 4_2023-02-16 in 0.59 sec.
2025-11-14 17:34:15,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:15,868 - INFO - Going to convert document batch...
2025-11-14 17:34:15,869 - INFO - Processing document 4_2023-02-21
2025-11-14 17:34:15,889 - INFO - Finished converting document 4_2023-02-21 in 0.06 sec.
2025-11-14 17:34:15,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:15,950 - INFO - Going to convert document batch...
2025-11-14 17:34:15,951 - INFO - Processing document 4_2023-02-28
2025-11-14 17:34:15,969 - INFO - Finished converting document 4_2023-02-28 in 0.06 sec.
2025-11-14 17:34:15,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,006 - INFO - Going to convert document batch...
2025-11-14 17:34:16,007 - 

Converted 'data\edgar_documents\SCHW\4_2023-02-16' --> 'data\processed_data\SCHW\4_2023-02-16.md'
Converted 'data\edgar_documents\SCHW\4_2023-02-21' --> 'data\processed_data\SCHW\4_2023-02-21.md'
Converted 'data\edgar_documents\SCHW\4_2023-02-28' --> 'data\processed_data\SCHW\4_2023-02-28.md'


2025-11-14 17:34:16,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,063 - INFO - Going to convert document batch...
2025-11-14 17:34:16,064 - INFO - Processing document 4_2023-03-06
2025-11-14 17:34:16,088 - INFO - Finished converting document 4_2023-03-06 in 0.03 sec.
2025-11-14 17:34:16,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,148 - INFO - Going to convert document batch...
2025-11-14 17:34:16,149 - INFO - Processing document 4_2023-03-14
2025-11-14 17:34:16,169 - INFO - Finished converting document 4_2023-03-14 in 0.06 sec.
2025-11-14 17:34:16,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,208 - INFO - Going to convert document batch...
2025-11-14 17:34:16,208 - INFO - Processing document 4_2023-03-15
2025-11-14 17:34:16,226 - INFO - Finished converting document 4_2023-03-15 in 0.03 sec.


Converted 'data\edgar_documents\SCHW\4_2023-03-03' --> 'data\processed_data\SCHW\4_2023-03-03.md'
Converted 'data\edgar_documents\SCHW\4_2023-03-06' --> 'data\processed_data\SCHW\4_2023-03-06.md'
Converted 'data\edgar_documents\SCHW\4_2023-03-14' --> 'data\processed_data\SCHW\4_2023-03-14.md'


2025-11-14 17:34:16,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,267 - INFO - Going to convert document batch...
2025-11-14 17:34:16,268 - INFO - Processing document 4_2023-03-16
2025-11-14 17:34:16,287 - INFO - Finished converting document 4_2023-03-16 in 0.03 sec.
2025-11-14 17:34:16,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,330 - INFO - Going to convert document batch...
2025-11-14 17:34:16,331 - INFO - Processing document 4_2023-03-17
2025-11-14 17:34:16,348 - INFO - Finished converting document 4_2023-03-17 in 0.03 sec.
2025-11-14 17:34:16,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,390 - INFO - Going to convert document batch...
2025-11-14 17:34:16,391 - INFO - Processing document 4_2023-03-20
2025-11-14 17:34:16,411 - INFO - Finished converting document 4_2023-03-20 in 0.05 sec.
2025-11-14 17:34:16,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2023-03-15' --> 'data\processed_data\SCHW\4_2023-03-15.md'
Converted 'data\edgar_documents\SCHW\4_2023-03-16' --> 'data\processed_data\SCHW\4_2023-03-16.md'
Converted 'data\edgar_documents\SCHW\4_2023-03-17' --> 'data\processed_data\SCHW\4_2023-03-17.md'
Converted 'data\edgar_documents\SCHW\4_2023-03-20' --> 'data\processed_data\SCHW\4_2023-03-20.md'


2025-11-14 17:34:16,456 - INFO - Going to convert document batch...
2025-11-14 17:34:16,457 - INFO - Processing document 4_2023-03-29
2025-11-14 17:34:16,474 - INFO - Finished converting document 4_2023-03-29 in 0.03 sec.
2025-11-14 17:34:16,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,533 - INFO - Going to convert document batch...
2025-11-14 17:34:16,534 - INFO - Processing document 4_2023-04-05
2025-11-14 17:34:16,566 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 17:34:16,649 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:34:16,651 - ERROR - Input document 4_2023-05-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\SCHW\4_2023-03-29' --> 'data\processed_data\SCHW\4_2023-03-29.md'
Converted 'data\edgar_documents\SCHW\4_2023-04-05' --> 'data\processed_data\SCHW\4_2023-04-05.md'
Error processing data\edgar_documents\SCHW\4_2023-05-17: File format not allowed: data\edgar_documents\SCHW\4_2023-05-17


2025-11-14 17:34:16,698 - INFO - Finished converting document 4_2023-05-19 in 0.05 sec.
2025-11-14 17:34:16,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,742 - INFO - Going to convert document batch...
2025-11-14 17:34:16,743 - INFO - Processing document 4_2023-05-23
2025-11-14 17:34:16,766 - INFO - Finished converting document 4_2023-05-23 in 0.05 sec.
2025-11-14 17:34:16,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,827 - INFO - Going to convert document batch...
2025-11-14 17:34:16,827 - INFO - Processing document 4_2023-05-24
2025-11-14 17:34:16,849 - INFO - Finished converting document 4_2023-05-24 in 0.05 sec.
2025-11-14 17:34:16,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2023-05-19' --> 'data\processed_data\SCHW\4_2023-05-19.md'
Converted 'data\edgar_documents\SCHW\4_2023-05-23' --> 'data\processed_data\SCHW\4_2023-05-23.md'
Converted 'data\edgar_documents\SCHW\4_2023-05-24' --> 'data\processed_data\SCHW\4_2023-05-24.md'


2025-11-14 17:34:16,914 - INFO - Going to convert document batch...
2025-11-14 17:34:16,915 - INFO - Processing document 4_2023-06-07
2025-11-14 17:34:16,933 - INFO - Finished converting document 4_2023-06-07 in 0.06 sec.
2025-11-14 17:34:16,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:16,984 - INFO - Going to convert document batch...
2025-11-14 17:34:16,985 - INFO - Processing document 4_2023-07-06
2025-11-14 17:34:17,006 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 17:34:17,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,050 - INFO - Going to convert document batch...
2025-11-14 17:34:17,051 - INFO - Processing document 4_2023-07-26
2025-11-14 17:34:17,076 - INFO - Finished converting document 4_2023-07-26 in 0.05 sec.
2025-11-14 17:34:17,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,119 - INFO - Going to convert document batch...
2025-11-14 17:34:17,120 - 

Converted 'data\edgar_documents\SCHW\4_2023-06-07' --> 'data\processed_data\SCHW\4_2023-06-07.md'
Converted 'data\edgar_documents\SCHW\4_2023-07-06' --> 'data\processed_data\SCHW\4_2023-07-06.md'
Converted 'data\edgar_documents\SCHW\4_2023-07-26' --> 'data\processed_data\SCHW\4_2023-07-26.md'


2025-11-14 17:34:17,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,179 - INFO - Going to convert document batch...
2025-11-14 17:34:17,181 - INFO - Processing document 4_2023-08-11
2025-11-14 17:34:17,202 - INFO - Finished converting document 4_2023-08-11 in 0.05 sec.
2025-11-14 17:34:17,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,243 - INFO - Going to convert document batch...
2025-11-14 17:34:17,244 - INFO - Processing document 4_2023-08-21
2025-11-14 17:34:17,263 - INFO - Finished converting document 4_2023-08-21 in 0.05 sec.
2025-11-14 17:34:17,307 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:34:17,308 - ERROR - Input document 4_2023-08-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\SCHW\4_2023-08-03' --> 'data\processed_data\SCHW\4_2023-08-03.md'
Converted 'data\edgar_documents\SCHW\4_2023-08-11' --> 'data\processed_data\SCHW\4_2023-08-11.md'
Converted 'data\edgar_documents\SCHW\4_2023-08-21' --> 'data\processed_data\SCHW\4_2023-08-21.md'
Error processing data\edgar_documents\SCHW\4_2023-08-22: File format not allowed: data\edgar_documents\SCHW\4_2023-08-22
Error processing data\edgar_documents\SCHW\4_2023-08-24: File format not allowed: data\edgar_documents\SCHW\4_2023-08-24


2025-11-14 17:34:17,353 - INFO - Going to convert document batch...
2025-11-14 17:34:17,354 - INFO - Processing document 4_2023-08-30
2025-11-14 17:34:17,377 - INFO - Finished converting document 4_2023-08-30 in 0.05 sec.
2025-11-14 17:34:17,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,440 - INFO - Going to convert document batch...
2025-11-14 17:34:17,442 - INFO - Processing document 4_2023-09-20
2025-11-14 17:34:17,469 - INFO - Finished converting document 4_2023-09-20 in 0.06 sec.
2025-11-14 17:34:17,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,515 - INFO - Going to convert document batch...
2025-11-14 17:34:17,516 - INFO - Processing document 4_2023-10-04
2025-11-14 17:34:17,537 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 17:34:17,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,594 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2023-08-30' --> 'data\processed_data\SCHW\4_2023-08-30.md'
Converted 'data\edgar_documents\SCHW\4_2023-09-20' --> 'data\processed_data\SCHW\4_2023-09-20.md'
Converted 'data\edgar_documents\SCHW\4_2023-10-04' --> 'data\processed_data\SCHW\4_2023-10-04.md'


2025-11-14 17:34:17,595 - INFO - Processing document 4_2023-10-23
2025-11-14 17:34:17,618 - INFO - Finished converting document 4_2023-10-23 in 0.05 sec.
2025-11-14 17:34:17,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,662 - INFO - Going to convert document batch...
2025-11-14 17:34:17,663 - INFO - Processing document 4_2023-10-26
2025-11-14 17:34:17,683 - INFO - Finished converting document 4_2023-10-26 in 0.05 sec.
2025-11-14 17:34:17,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,725 - INFO - Going to convert document batch...
2025-11-14 17:34:17,725 - INFO - Processing document 4_2023-11-01
2025-11-14 17:34:17,745 - INFO - Finished converting document 4_2023-11-01 in 0.05 sec.
2025-11-14 17:34:17,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,786 - INFO - Going to convert document batch...
2025-11-14 17:34:17,786 - INFO - Processing document 4_2023-11-03
2025-11-14 17:34:17,806 - IN

Converted 'data\edgar_documents\SCHW\4_2023-10-23' --> 'data\processed_data\SCHW\4_2023-10-23.md'
Converted 'data\edgar_documents\SCHW\4_2023-10-26' --> 'data\processed_data\SCHW\4_2023-10-26.md'
Converted 'data\edgar_documents\SCHW\4_2023-11-01' --> 'data\processed_data\SCHW\4_2023-11-01.md'
Converted 'data\edgar_documents\SCHW\4_2023-11-03' --> 'data\processed_data\SCHW\4_2023-11-03.md'


2025-11-14 17:34:17,859 - INFO - Going to convert document batch...
2025-11-14 17:34:17,860 - INFO - Processing document 4_2023-11-06
2025-11-14 17:34:17,880 - INFO - Finished converting document 4_2023-11-06 in 0.05 sec.
2025-11-14 17:34:17,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:17,924 - INFO - Going to convert document batch...
2025-11-14 17:34:17,925 - INFO - Processing document 4_2023-11-07
2025-11-14 17:34:17,945 - INFO - Finished converting document 4_2023-11-07 in 0.03 sec.
2025-11-14 17:34:18,030 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:34:18,031 - ERROR - Input document 4_2023-11-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\SCHW\4_2023-11-06' --> 'data\processed_data\SCHW\4_2023-11-06.md'
Converted 'data\edgar_documents\SCHW\4_2023-11-07' --> 'data\processed_data\SCHW\4_2023-11-07.md'
Error processing data\edgar_documents\SCHW\4_2023-11-15: File format not allowed: data\edgar_documents\SCHW\4_2023-11-15
Error processing data\edgar_documents\SCHW\4_2023-11-17: File format not allowed: data\edgar_documents\SCHW\4_2023-11-17


2025-11-14 17:34:18,102 - INFO - Finished converting document 4_2023-12-04 in 0.03 sec.
2025-11-14 17:34:18,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,145 - INFO - Going to convert document batch...
2025-11-14 17:34:18,146 - INFO - Processing document 4_2023-12-19
2025-11-14 17:34:18,171 - INFO - Finished converting document 4_2023-12-19 in 0.05 sec.
2025-11-14 17:34:18,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,216 - INFO - Going to convert document batch...
2025-11-14 17:34:18,216 - INFO - Processing document 4_2024-01-04
2025-11-14 17:34:18,236 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 17:34:18,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,276 - INFO - Going to convert document batch...
2025-11-14 17:34:18,276 - INFO - Processing document 4_2024-01-24
2025-11-14 17:34:18,294 - INFO - Finished converting document 4_2024-01-24 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\4_2023-12-04' --> 'data\processed_data\SCHW\4_2023-12-04.md'
Converted 'data\edgar_documents\SCHW\4_2023-12-19' --> 'data\processed_data\SCHW\4_2023-12-19.md'
Converted 'data\edgar_documents\SCHW\4_2024-01-04' --> 'data\processed_data\SCHW\4_2024-01-04.md'


2025-11-14 17:34:18,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,335 - INFO - Going to convert document batch...
2025-11-14 17:34:18,337 - INFO - Processing document 4_2024-01-26
2025-11-14 17:34:18,358 - INFO - Finished converting document 4_2024-01-26 in 0.05 sec.
2025-11-14 17:34:18,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,402 - INFO - Going to convert document batch...
2025-11-14 17:34:18,403 - INFO - Processing document 4_2024-02-05
2025-11-14 17:34:18,428 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 17:34:18,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,472 - INFO - Going to convert document batch...
2025-11-14 17:34:18,472 - INFO - Processing document 4_2024-02-12
2025-11-14 17:34:18,492 - INFO - Finished converting document 4_2024-02-12 in 0.03 sec.


Converted 'data\edgar_documents\SCHW\4_2024-01-24' --> 'data\processed_data\SCHW\4_2024-01-24.md'
Converted 'data\edgar_documents\SCHW\4_2024-01-26' --> 'data\processed_data\SCHW\4_2024-01-26.md'
Converted 'data\edgar_documents\SCHW\4_2024-02-05' --> 'data\processed_data\SCHW\4_2024-02-05.md'


2025-11-14 17:34:18,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,538 - INFO - Going to convert document batch...
2025-11-14 17:34:18,539 - INFO - Processing document 4_2024-02-20
2025-11-14 17:34:18,576 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 17:34:18,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,635 - INFO - Going to convert document batch...
2025-11-14 17:34:18,636 - INFO - Processing document 4_2024-02-26
2025-11-14 17:34:18,659 - INFO - Finished converting document 4_2024-02-26 in 0.05 sec.
2025-11-14 17:34:18,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,703 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2024-02-12' --> 'data\processed_data\SCHW\4_2024-02-12.md'
Converted 'data\edgar_documents\SCHW\4_2024-02-20' --> 'data\processed_data\SCHW\4_2024-02-20.md'
Converted 'data\edgar_documents\SCHW\4_2024-02-26' --> 'data\processed_data\SCHW\4_2024-02-26.md'


2025-11-14 17:34:18,704 - INFO - Processing document 4_2024-03-01
2025-11-14 17:34:18,725 - INFO - Finished converting document 4_2024-03-01 in 0.03 sec.
2025-11-14 17:34:18,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,773 - INFO - Going to convert document batch...
2025-11-14 17:34:18,774 - INFO - Processing document 4_2024-03-05
2025-11-14 17:34:18,805 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:34:18,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,860 - INFO - Going to convert document batch...
2025-11-14 17:34:18,861 - INFO - Processing document 4_2024-03-08
2025-11-14 17:34:18,883 - INFO - Finished converting document 4_2024-03-08 in 0.05 sec.
2025-11-14 17:34:18,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,925 - INFO - Going to convert document batch...
2025-11-14 17:34:18,925 - INFO - Processing document 4_2024-03-25
2025-11-14 17:34:18,949 - IN

Converted 'data\edgar_documents\SCHW\4_2024-03-01' --> 'data\processed_data\SCHW\4_2024-03-01.md'
Converted 'data\edgar_documents\SCHW\4_2024-03-05' --> 'data\processed_data\SCHW\4_2024-03-05.md'
Converted 'data\edgar_documents\SCHW\4_2024-03-08' --> 'data\processed_data\SCHW\4_2024-03-08.md'


2025-11-14 17:34:18,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:18,995 - INFO - Going to convert document batch...
2025-11-14 17:34:18,996 - INFO - Processing document 4_2024-03-26
2025-11-14 17:34:19,022 - INFO - Finished converting document 4_2024-03-26 in 0.05 sec.
2025-11-14 17:34:19,059 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,069 - INFO - Going to convert document batch...
2025-11-14 17:34:19,070 - INFO - Processing document 4_2024-03-28
2025-11-14 17:34:19,094 - INFO - Finished converting document 4_2024-03-28 in 0.05 sec.
2025-11-14 17:34:19,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,138 - INFO - Going to convert document batch...
2025-11-14 17:34:19,139 - INFO - Processing document 4_2024-04-03


Converted 'data\edgar_documents\SCHW\4_2024-03-25' --> 'data\processed_data\SCHW\4_2024-03-25.md'
Converted 'data\edgar_documents\SCHW\4_2024-03-26' --> 'data\processed_data\SCHW\4_2024-03-26.md'
Converted 'data\edgar_documents\SCHW\4_2024-03-28' --> 'data\processed_data\SCHW\4_2024-03-28.md'


2025-11-14 17:34:19,158 - INFO - Finished converting document 4_2024-04-03 in 0.05 sec.
2025-11-14 17:34:19,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,200 - INFO - Going to convert document batch...
2025-11-14 17:34:19,201 - INFO - Processing document 4_2024-04-18
2025-11-14 17:34:19,225 - INFO - Finished converting document 4_2024-04-18 in 0.05 sec.
2025-11-14 17:34:19,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,276 - INFO - Going to convert document batch...
2025-11-14 17:34:19,277 - INFO - Processing document 4_2024-04-22
2025-11-14 17:34:19,305 - INFO - Finished converting document 4_2024-04-22 in 0.05 sec.
2025-11-14 17:34:19,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2024-04-03' --> 'data\processed_data\SCHW\4_2024-04-03.md'
Converted 'data\edgar_documents\SCHW\4_2024-04-18' --> 'data\processed_data\SCHW\4_2024-04-18.md'
Converted 'data\edgar_documents\SCHW\4_2024-04-22' --> 'data\processed_data\SCHW\4_2024-04-22.md'


2025-11-14 17:34:19,370 - INFO - Going to convert document batch...
2025-11-14 17:34:19,371 - INFO - Processing document 4_2024-04-23
2025-11-14 17:34:19,403 - INFO - Finished converting document 4_2024-04-23 in 0.08 sec.
2025-11-14 17:34:19,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,453 - INFO - Going to convert document batch...
2025-11-14 17:34:19,454 - INFO - Processing document 4_2024-04-24
2025-11-14 17:34:19,474 - INFO - Finished converting document 4_2024-04-24 in 0.03 sec.
2025-11-14 17:34:19,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,515 - INFO - Going to convert document batch...
2025-11-14 17:34:19,516 - INFO - Processing document 4_2024-04-26
2025-11-14 17:34:19,538 - INFO - Finished converting document 4_2024-04-26 in 0.05 sec.
2025-11-14 17:34:19,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,581 - INFO - Going to convert document batch...
2025-11-14 17:34:19,582 - 

Converted 'data\edgar_documents\SCHW\4_2024-04-23' --> 'data\processed_data\SCHW\4_2024-04-23.md'
Converted 'data\edgar_documents\SCHW\4_2024-04-24' --> 'data\processed_data\SCHW\4_2024-04-24.md'
Converted 'data\edgar_documents\SCHW\4_2024-04-26' --> 'data\processed_data\SCHW\4_2024-04-26.md'


2025-11-14 17:34:19,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,645 - INFO - Going to convert document batch...
2025-11-14 17:34:19,646 - INFO - Processing document 4_2024-05-08
2025-11-14 17:34:19,666 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.
2025-11-14 17:34:19,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,736 - INFO - Going to convert document batch...
2025-11-14 17:34:19,737 - INFO - Processing document 4_2024-05-10
2025-11-14 17:34:19,763 - INFO - Finished converting document 4_2024-05-10 in 0.06 sec.
2025-11-14 17:34:19,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:19,806 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2024-04-30' --> 'data\processed_data\SCHW\4_2024-04-30.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-08' --> 'data\processed_data\SCHW\4_2024-05-08.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-10' --> 'data\processed_data\SCHW\4_2024-05-10.md'


2025-11-14 17:34:19,807 - INFO - Processing document 4_2024-05-13
2025-11-14 17:34:20,051 - INFO - Finished converting document 4_2024-05-13 in 0.27 sec.
2025-11-14 17:34:20,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,096 - INFO - Going to convert document batch...
2025-11-14 17:34:20,097 - INFO - Processing document 4_2024-05-16
2025-11-14 17:34:20,119 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 17:34:20,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,159 - INFO - Going to convert document batch...
2025-11-14 17:34:20,159 - INFO - Processing document 4_2024-05-21
2025-11-14 17:34:20,180 - INFO - Finished converting document 4_2024-05-21 in 0.03 sec.
2025-11-14 17:34:20,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,236 - INFO - Going to convert document batch...
2025-11-14 17:34:20,237 - INFO - Processing document 4_2024-05-22
2025-11-14 17:34:20,257 - IN

Converted 'data\edgar_documents\SCHW\4_2024-05-13' --> 'data\processed_data\SCHW\4_2024-05-13.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-16' --> 'data\processed_data\SCHW\4_2024-05-16.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-21' --> 'data\processed_data\SCHW\4_2024-05-21.md'


2025-11-14 17:34:20,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,299 - INFO - Going to convert document batch...
2025-11-14 17:34:20,300 - INFO - Processing document 4_2024-05-24
2025-11-14 17:34:20,318 - INFO - Finished converting document 4_2024-05-24 in 0.03 sec.
2025-11-14 17:34:20,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,365 - INFO - Going to convert document batch...
2025-11-14 17:34:20,366 - INFO - Processing document 4_2024-05-30
2025-11-14 17:34:20,393 - INFO - Finished converting document 4_2024-05-30 in 0.05 sec.
2025-11-14 17:34:20,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,440 - INFO - Going to convert document batch...
2025-11-14 17:34:20,441 - INFO - Processing document 4_2024-05-31
2025-11-14 17:34:20,462 - INFO - Finished converting document 4_2024-05-31 in 0.03 sec.


Converted 'data\edgar_documents\SCHW\4_2024-05-22' --> 'data\processed_data\SCHW\4_2024-05-22.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-24' --> 'data\processed_data\SCHW\4_2024-05-24.md'
Converted 'data\edgar_documents\SCHW\4_2024-05-30' --> 'data\processed_data\SCHW\4_2024-05-30.md'


2025-11-14 17:34:20,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,508 - INFO - Going to convert document batch...
2025-11-14 17:34:20,509 - INFO - Processing document 4_2024-06-14
2025-11-14 17:34:20,536 - INFO - Finished converting document 4_2024-06-14 in 0.05 sec.
2025-11-14 17:34:20,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,582 - INFO - Going to convert document batch...
2025-11-14 17:34:20,583 - INFO - Processing document 4_2024-06-24
2025-11-14 17:34:20,606 - INFO - Finished converting document 4_2024-06-24 in 0.05 sec.
2025-11-14 17:34:20,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,670 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2024-05-31' --> 'data\processed_data\SCHW\4_2024-05-31.md'
Converted 'data\edgar_documents\SCHW\4_2024-06-14' --> 'data\processed_data\SCHW\4_2024-06-14.md'
Converted 'data\edgar_documents\SCHW\4_2024-06-24' --> 'data\processed_data\SCHW\4_2024-06-24.md'


2025-11-14 17:34:20,671 - INFO - Processing document 4_2024-07-03
2025-11-14 17:34:20,696 - INFO - Finished converting document 4_2024-07-03 in 0.06 sec.
2025-11-14 17:34:20,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,743 - INFO - Going to convert document batch...
2025-11-14 17:34:20,744 - INFO - Processing document 4_2024-07-15
2025-11-14 17:34:20,767 - INFO - Finished converting document 4_2024-07-15 in 0.05 sec.
2025-11-14 17:34:20,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,810 - INFO - Going to convert document batch...
2025-11-14 17:34:20,811 - INFO - Processing document 4_2024-07-19
2025-11-14 17:34:20,832 - INFO - Finished converting document 4_2024-07-19 in 0.05 sec.
2025-11-14 17:34:20,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,890 - INFO - Going to convert document batch...
2025-11-14 17:34:20,891 - INFO - Processing document 4_2024-07-23


Converted 'data\edgar_documents\SCHW\4_2024-07-03' --> 'data\processed_data\SCHW\4_2024-07-03.md'
Converted 'data\edgar_documents\SCHW\4_2024-07-15' --> 'data\processed_data\SCHW\4_2024-07-15.md'
Converted 'data\edgar_documents\SCHW\4_2024-07-19' --> 'data\processed_data\SCHW\4_2024-07-19.md'


2025-11-14 17:34:20,917 - INFO - Finished converting document 4_2024-07-23 in 0.06 sec.
2025-11-14 17:34:20,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:20,964 - INFO - Going to convert document batch...
2025-11-14 17:34:20,965 - INFO - Processing document 4_2024-08-02
2025-11-14 17:34:20,989 - INFO - Finished converting document 4_2024-08-02 in 0.05 sec.
2025-11-14 17:34:21,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,034 - INFO - Going to convert document batch...
2025-11-14 17:34:21,035 - INFO - Processing document 4_2024-08-19
2025-11-14 17:34:21,057 - INFO - Finished converting document 4_2024-08-19 in 0.05 sec.
2025-11-14 17:34:21,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,102 - INFO - Going to convert document batch...
2025-11-14 17:34:21,104 - INFO - Processing document 4_2024-09-20
2025-11-14 17:34:21,124 - INFO - Finished converting document 4_2024-09-20 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\4_2024-07-23' --> 'data\processed_data\SCHW\4_2024-07-23.md'
Converted 'data\edgar_documents\SCHW\4_2024-08-02' --> 'data\processed_data\SCHW\4_2024-08-02.md'
Converted 'data\edgar_documents\SCHW\4_2024-08-19' --> 'data\processed_data\SCHW\4_2024-08-19.md'


2025-11-14 17:34:21,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,169 - INFO - Going to convert document batch...
2025-11-14 17:34:21,169 - INFO - Processing document 4_2024-10-03
2025-11-14 17:34:21,188 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 17:34:21,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,233 - INFO - Going to convert document batch...
2025-11-14 17:34:21,234 - INFO - Processing document 4_2024-10-17
2025-11-14 17:34:21,260 - INFO - Finished converting document 4_2024-10-17 in 0.06 sec.
2025-11-14 17:34:21,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,305 - INFO - Going to convert document batch...
2025-11-14 17:34:21,306 - INFO - Processing document 4_2024-10-18
2025-11-14 17:34:21,327 - INFO - Finished converting document 4_2024-10-18 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\4_2024-09-20' --> 'data\processed_data\SCHW\4_2024-09-20.md'
Converted 'data\edgar_documents\SCHW\4_2024-10-03' --> 'data\processed_data\SCHW\4_2024-10-03.md'
Converted 'data\edgar_documents\SCHW\4_2024-10-17' --> 'data\processed_data\SCHW\4_2024-10-17.md'


2025-11-14 17:34:21,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,371 - INFO - Going to convert document batch...
2025-11-14 17:34:21,371 - INFO - Processing document 4_2024-10-22
2025-11-14 17:34:21,396 - INFO - Finished converting document 4_2024-10-22 in 0.05 sec.
2025-11-14 17:34:21,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,452 - INFO - Going to convert document batch...
2025-11-14 17:34:21,453 - INFO - Processing document 4_2024-10-28
2025-11-14 17:34:21,482 - INFO - Finished converting document 4_2024-10-28 in 0.06 sec.
2025-11-14 17:34:21,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2024-10-18' --> 'data\processed_data\SCHW\4_2024-10-18.md'
Converted 'data\edgar_documents\SCHW\4_2024-10-22' --> 'data\processed_data\SCHW\4_2024-10-22.md'
Converted 'data\edgar_documents\SCHW\4_2024-10-28' --> 'data\processed_data\SCHW\4_2024-10-28.md'


2025-11-14 17:34:21,550 - INFO - Going to convert document batch...
2025-11-14 17:34:21,551 - INFO - Processing document 4_2024-11-08
2025-11-14 17:34:21,574 - INFO - Finished converting document 4_2024-11-08 in 0.06 sec.
2025-11-14 17:34:21,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,623 - INFO - Going to convert document batch...
2025-11-14 17:34:21,624 - INFO - Processing document 4_2024-11-12
2025-11-14 17:34:21,649 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:34:21,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,693 - INFO - Going to convert document batch...
2025-11-14 17:34:21,694 - INFO - Processing document 4_2024-11-14
2025-11-14 17:34:21,720 - INFO - Finished converting document 4_2024-11-14 in 0.05 sec.
2025-11-14 17:34:21,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,765 - INFO - Going to convert document batch...
2025-11-14 17:34:21,766 - 

Converted 'data\edgar_documents\SCHW\4_2024-11-08' --> 'data\processed_data\SCHW\4_2024-11-08.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-12' --> 'data\processed_data\SCHW\4_2024-11-12.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-14' --> 'data\processed_data\SCHW\4_2024-11-14.md'


2025-11-14 17:34:21,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,829 - INFO - Going to convert document batch...
2025-11-14 17:34:21,830 - INFO - Processing document 4_2024-11-19
2025-11-14 17:34:21,859 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 17:34:21,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:21,929 - INFO - Going to convert document batch...
2025-11-14 17:34:21,930 - INFO - Processing document 4_2024-11-20
2025-11-14 17:34:21,957 - INFO - Finished converting document 4_2024-11-20 in 0.06 sec.
2025-11-14 17:34:22,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2024-11-18' --> 'data\processed_data\SCHW\4_2024-11-18.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-19' --> 'data\processed_data\SCHW\4_2024-11-19.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-20' --> 'data\processed_data\SCHW\4_2024-11-20.md'


2025-11-14 17:34:22,020 - INFO - Going to convert document batch...
2025-11-14 17:34:22,021 - INFO - Processing document 4_2024-11-26
2025-11-14 17:34:22,042 - INFO - Finished converting document 4_2024-11-26 in 0.06 sec.
2025-11-14 17:34:22,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,088 - INFO - Going to convert document batch...
2025-11-14 17:34:22,089 - INFO - Processing document 4_2024-11-27
2025-11-14 17:34:22,113 - INFO - Finished converting document 4_2024-11-27 in 0.05 sec.
2025-11-14 17:34:22,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,155 - INFO - Going to convert document batch...
2025-11-14 17:34:22,156 - INFO - Processing document 4_2024-11-29
2025-11-14 17:34:22,175 - INFO - Finished converting document 4_2024-11-29 in 0.03 sec.
2025-11-14 17:34:22,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,222 - INFO - Going to convert document batch...
2025-11-14 17:34:22,223 - 

Converted 'data\edgar_documents\SCHW\4_2024-11-26' --> 'data\processed_data\SCHW\4_2024-11-26.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-27' --> 'data\processed_data\SCHW\4_2024-11-27.md'
Converted 'data\edgar_documents\SCHW\4_2024-11-29' --> 'data\processed_data\SCHW\4_2024-11-29.md'


2025-11-14 17:34:22,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,290 - INFO - Going to convert document batch...
2025-11-14 17:34:22,292 - INFO - Processing document 4_2024-12-19
2025-11-14 17:34:22,323 - INFO - Finished converting document 4_2024-12-19 in 0.06 sec.
2025-11-14 17:34:22,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,381 - INFO - Going to convert document batch...
2025-11-14 17:34:22,381 - INFO - Processing document 4_2025-01-03
2025-11-14 17:34:22,406 - INFO - Finished converting document 4_2025-01-03 in 0.06 sec.
2025-11-14 17:34:22,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,455 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2024-12-17' --> 'data\processed_data\SCHW\4_2024-12-17.md'
Converted 'data\edgar_documents\SCHW\4_2024-12-19' --> 'data\processed_data\SCHW\4_2024-12-19.md'
Converted 'data\edgar_documents\SCHW\4_2025-01-03' --> 'data\processed_data\SCHW\4_2025-01-03.md'


2025-11-14 17:34:22,456 - INFO - Processing document 4_2025-01-06
2025-11-14 17:34:22,481 - INFO - Finished converting document 4_2025-01-06 in 0.06 sec.
2025-11-14 17:34:22,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,552 - INFO - Going to convert document batch...
2025-11-14 17:34:22,554 - INFO - Processing document 4_2025-01-24
2025-11-14 17:34:22,585 - INFO - Finished converting document 4_2025-01-24 in 0.06 sec.
2025-11-14 17:34:22,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,641 - INFO - Going to convert document batch...
2025-11-14 17:34:22,642 - INFO - Processing document 4_2025-01-27
2025-11-14 17:34:22,665 - INFO - Finished converting document 4_2025-01-27 in 0.05 sec.
2025-11-14 17:34:22,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-01-06' --> 'data\processed_data\SCHW\4_2025-01-06.md'
Converted 'data\edgar_documents\SCHW\4_2025-01-24' --> 'data\processed_data\SCHW\4_2025-01-24.md'
Converted 'data\edgar_documents\SCHW\4_2025-01-27' --> 'data\processed_data\SCHW\4_2025-01-27.md'


2025-11-14 17:34:22,708 - INFO - Going to convert document batch...
2025-11-14 17:34:22,709 - INFO - Processing document 4_2025-02-07
2025-11-14 17:34:22,730 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 17:34:22,774 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:34:22,775 - ERROR - Input document 4_2025-02-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:34:22,776 - INFO - Going to convert document batch...
2025-11-14 17:34:22,798 - IN

Converted 'data\edgar_documents\SCHW\4_2025-02-07' --> 'data\processed_data\SCHW\4_2025-02-07.md'
Error processing data\edgar_documents\SCHW\4_2025-02-10: File format not allowed: data\edgar_documents\SCHW\4_2025-02-10
Error processing data\edgar_documents\SCHW\4_2025-02-11: File format not allowed: data\edgar_documents\SCHW\4_2025-02-11
Converted 'data\edgar_documents\SCHW\4_2025-02-14' --> 'data\processed_data\SCHW\4_2025-02-14.md'
Converted 'data\edgar_documents\SCHW\4_2025-02-19' --> 'data\processed_data\SCHW\4_2025-02-19.md'


2025-11-14 17:34:22,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:22,981 - INFO - Going to convert document batch...
2025-11-14 17:34:22,981 - INFO - Processing document 4_2025-02-25
2025-11-14 17:34:23,004 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 17:34:23,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,050 - INFO - Going to convert document batch...
2025-11-14 17:34:23,050 - INFO - Processing document 4_2025-03-03
2025-11-14 17:34:23,070 - INFO - Finished converting document 4_2025-03-03 in 0.03 sec.
2025-11-14 17:34:23,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,132 - INFO - Going to convert document batch...
2025-11-14 17:34:23,132 - INFO - Processing document 4_2025-03-04
2025-11-14 17:34:23,151 - INFO - Finished converting document 4_2025-03-04 in 0.06 sec.
2025-11-14 17:34:23,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\SCHW\4_2025-02-25' --> 'data\processed_data\SCHW\4_2025-02-25.md'
Converted 'data\edgar_documents\SCHW\4_2025-03-03' --> 'data\processed_data\SCHW\4_2025-03-03.md'
Converted 'data\edgar_documents\SCHW\4_2025-03-04' --> 'data\processed_data\SCHW\4_2025-03-04.md'


2025-11-14 17:34:23,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,256 - INFO - Going to convert document batch...
2025-11-14 17:34:23,257 - INFO - Processing document 4_2025-03-10
2025-11-14 17:34:23,305 - INFO - Finished converting document 4_2025-03-10 in 0.06 sec.
2025-11-14 17:34:23,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,364 - INFO - Going to convert document batch...
2025-11-14 17:34:23,365 - INFO - Processing document 4_2025-03-17
2025-11-14 17:34:23,394 - INFO - Finished converting document 4_2025-03-17 in 0.06 sec.
2025-11-14 17:34:23,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-03-07' --> 'data\processed_data\SCHW\4_2025-03-07.md'
Converted 'data\edgar_documents\SCHW\4_2025-03-10' --> 'data\processed_data\SCHW\4_2025-03-10.md'
Converted 'data\edgar_documents\SCHW\4_2025-03-17' --> 'data\processed_data\SCHW\4_2025-03-17.md'


2025-11-14 17:34:23,443 - INFO - Going to convert document batch...
2025-11-14 17:34:23,444 - INFO - Processing document 4_2025-03-27
2025-11-14 17:34:23,468 - INFO - Finished converting document 4_2025-03-27 in 0.05 sec.
2025-11-14 17:34:23,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,517 - INFO - Going to convert document batch...
2025-11-14 17:34:23,518 - INFO - Processing document 4_2025-04-02
2025-11-14 17:34:23,541 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 17:34:23,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,582 - INFO - Going to convert document batch...
2025-11-14 17:34:23,582 - INFO - Processing document 4_2025-04-03
2025-11-14 17:34:23,604 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:34:23,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,672 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2025-03-27' --> 'data\processed_data\SCHW\4_2025-03-27.md'
Converted 'data\edgar_documents\SCHW\4_2025-04-02' --> 'data\processed_data\SCHW\4_2025-04-02.md'
Converted 'data\edgar_documents\SCHW\4_2025-04-03' --> 'data\processed_data\SCHW\4_2025-04-03.md'


2025-11-14 17:34:23,673 - INFO - Processing document 4_2025-04-07
2025-11-14 17:34:23,697 - INFO - Finished converting document 4_2025-04-07 in 0.06 sec.
2025-11-14 17:34:23,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:23,748 - INFO - Going to convert document batch...
2025-11-14 17:34:23,748 - INFO - Processing document 4_2025-04-22
2025-11-14 17:34:23,773 - INFO - Finished converting document 4_2025-04-22 in 0.05 sec.
2025-11-14 17:34:23,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-04-07' --> 'data\processed_data\SCHW\4_2025-04-07.md'
Converted 'data\edgar_documents\SCHW\4_2025-04-22' --> 'data\processed_data\SCHW\4_2025-04-22.md'


2025-11-14 17:34:24,055 - INFO - Going to convert document batch...
2025-11-14 17:34:24,055 - INFO - Processing document 4_2025-04-24
2025-11-14 17:34:24,078 - INFO - Finished converting document 4_2025-04-24 in 0.28 sec.
2025-11-14 17:34:24,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,134 - INFO - Going to convert document batch...
2025-11-14 17:34:24,136 - INFO - Processing document 4_2025-04-29
2025-11-14 17:34:24,172 - INFO - Finished converting document 4_2025-04-29 in 0.08 sec.
2025-11-14 17:34:24,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,214 - INFO - Going to convert document batch...
2025-11-14 17:34:24,215 - INFO - Processing document 4_2025-05-01
2025-11-14 17:34:24,237 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-11-14 17:34:24,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,279 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2025-04-24' --> 'data\processed_data\SCHW\4_2025-04-24.md'
Converted 'data\edgar_documents\SCHW\4_2025-04-29' --> 'data\processed_data\SCHW\4_2025-04-29.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-01' --> 'data\processed_data\SCHW\4_2025-05-01.md'


2025-11-14 17:34:24,280 - INFO - Processing document 4_2025-05-02
2025-11-14 17:34:24,302 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 17:34:24,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,350 - INFO - Going to convert document batch...
2025-11-14 17:34:24,351 - INFO - Processing document 4_2025-05-05
2025-11-14 17:34:24,379 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 17:34:24,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,446 - INFO - Going to convert document batch...
2025-11-14 17:34:24,447 - INFO - Processing document 4_2025-05-06
2025-11-14 17:34:24,469 - INFO - Finished converting document 4_2025-05-06 in 0.06 sec.
2025-11-14 17:34:24,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,509 - INFO - Going to convert document batch...
2025-11-14 17:34:24,510 - INFO - Processing document 4_2025-05-07


Converted 'data\edgar_documents\SCHW\4_2025-05-02' --> 'data\processed_data\SCHW\4_2025-05-02.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-05' --> 'data\processed_data\SCHW\4_2025-05-05.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-06' --> 'data\processed_data\SCHW\4_2025-05-06.md'


2025-11-14 17:34:24,529 - INFO - Finished converting document 4_2025-05-07 in 0.05 sec.
2025-11-14 17:34:24,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,570 - INFO - Going to convert document batch...
2025-11-14 17:34:24,572 - INFO - Processing document 4_2025-05-09
2025-11-14 17:34:24,619 - INFO - Finished converting document 4_2025-05-09 in 0.06 sec.
2025-11-14 17:34:24,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,672 - INFO - Going to convert document batch...
2025-11-14 17:34:24,673 - INFO - Processing document 4_2025-05-12
2025-11-14 17:34:24,695 - INFO - Finished converting document 4_2025-05-12 in 0.05 sec.
2025-11-14 17:34:24,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-05-07' --> 'data\processed_data\SCHW\4_2025-05-07.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-09' --> 'data\processed_data\SCHW\4_2025-05-09.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-12' --> 'data\processed_data\SCHW\4_2025-05-12.md'


2025-11-14 17:34:24,739 - INFO - Going to convert document batch...
2025-11-14 17:34:24,739 - INFO - Processing document 4_2025-05-14
2025-11-14 17:34:24,763 - INFO - Finished converting document 4_2025-05-14 in 0.05 sec.
2025-11-14 17:34:24,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,822 - INFO - Going to convert document batch...
2025-11-14 17:34:24,822 - INFO - Processing document 4_2025-05-19
2025-11-14 17:34:24,844 - INFO - Finished converting document 4_2025-05-19 in 0.06 sec.
2025-11-14 17:34:24,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,888 - INFO - Going to convert document batch...
2025-11-14 17:34:24,888 - INFO - Processing document 4_2025-05-20
2025-11-14 17:34:24,910 - INFO - Finished converting document 4_2025-05-20 in 0.05 sec.
2025-11-14 17:34:24,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:24,952 - INFO - Going to convert document batch...
2025-11-14 17:34:24,952 - 

Converted 'data\edgar_documents\SCHW\4_2025-05-14' --> 'data\processed_data\SCHW\4_2025-05-14.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-19' --> 'data\processed_data\SCHW\4_2025-05-19.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-20' --> 'data\processed_data\SCHW\4_2025-05-20.md'


2025-11-14 17:34:25,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,019 - INFO - Going to convert document batch...
2025-11-14 17:34:25,020 - INFO - Processing document 4_2025-05-23
2025-11-14 17:34:25,043 - INFO - Finished converting document 4_2025-05-23 in 0.05 sec.
2025-11-14 17:34:25,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,114 - INFO - Going to convert document batch...
2025-11-14 17:34:25,115 - INFO - Processing document 4_2025-05-27
2025-11-14 17:34:25,147 - INFO - Finished converting document 4_2025-05-27 in 0.06 sec.
2025-11-14 17:34:25,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-05-22' --> 'data\processed_data\SCHW\4_2025-05-22.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-23' --> 'data\processed_data\SCHW\4_2025-05-23.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-27' --> 'data\processed_data\SCHW\4_2025-05-27.md'


2025-11-14 17:34:25,196 - INFO - Going to convert document batch...
2025-11-14 17:34:25,197 - INFO - Processing document 4_2025-05-29
2025-11-14 17:34:25,223 - INFO - Finished converting document 4_2025-05-29 in 0.05 sec.
2025-11-14 17:34:25,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,270 - INFO - Going to convert document batch...
2025-11-14 17:34:25,270 - INFO - Processing document 4_2025-05-30
2025-11-14 17:34:25,294 - INFO - Finished converting document 4_2025-05-30 in 0.05 sec.
2025-11-14 17:34:25,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,340 - INFO - Going to convert document batch...
2025-11-14 17:34:25,341 - INFO - Processing document 4_2025-06-02
2025-11-14 17:34:25,359 - INFO - Finished converting document 4_2025-06-02 in 0.05 sec.
2025-11-14 17:34:25,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,420 - INFO - Going to convert document batch...
2025-11-14 17:34:25,421 - 

Converted 'data\edgar_documents\SCHW\4_2025-05-29' --> 'data\processed_data\SCHW\4_2025-05-29.md'
Converted 'data\edgar_documents\SCHW\4_2025-05-30' --> 'data\processed_data\SCHW\4_2025-05-30.md'
Converted 'data\edgar_documents\SCHW\4_2025-06-02' --> 'data\processed_data\SCHW\4_2025-06-02.md'


2025-11-14 17:34:25,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,499 - INFO - Going to convert document batch...
2025-11-14 17:34:25,500 - INFO - Processing document 4_2025-06-04
2025-11-14 17:34:25,519 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 17:34:25,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,564 - INFO - Going to convert document batch...
2025-11-14 17:34:25,565 - INFO - Processing document 4_2025-06-06
2025-11-14 17:34:25,586 - INFO - Finished converting document 4_2025-06-06 in 0.03 sec.
2025-11-14 17:34:25,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,650 - INFO - Going to convert document batch...
2025-11-14 17:34:25,651 - INFO - Processing document 4_2025-06-20


Converted 'data\edgar_documents\SCHW\4_2025-06-03' --> 'data\processed_data\SCHW\4_2025-06-03.md'
Converted 'data\edgar_documents\SCHW\4_2025-06-04' --> 'data\processed_data\SCHW\4_2025-06-04.md'
Converted 'data\edgar_documents\SCHW\4_2025-06-06' --> 'data\processed_data\SCHW\4_2025-06-06.md'


2025-11-14 17:34:25,682 - INFO - Finished converting document 4_2025-06-20 in 0.08 sec.
2025-11-14 17:34:25,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,732 - INFO - Going to convert document batch...
2025-11-14 17:34:25,733 - INFO - Processing document 4_2025-06-26
2025-11-14 17:34:25,755 - INFO - Finished converting document 4_2025-06-26 in 0.05 sec.
2025-11-14 17:34:25,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,803 - INFO - Going to convert document batch...
2025-11-14 17:34:25,804 - INFO - Processing document 4_2025-07-02
2025-11-14 17:34:25,824 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:34:25,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,868 - INFO - Going to convert document batch...
2025-11-14 17:34:25,869 - INFO - Processing document 4_2025-07-03
2025-11-14 17:34:25,889 - INFO - Finished converting document 4_2025-07-03 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\4_2025-06-20' --> 'data\processed_data\SCHW\4_2025-06-20.md'
Converted 'data\edgar_documents\SCHW\4_2025-06-26' --> 'data\processed_data\SCHW\4_2025-06-26.md'
Converted 'data\edgar_documents\SCHW\4_2025-07-02' --> 'data\processed_data\SCHW\4_2025-07-02.md'


2025-11-14 17:34:25,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:25,947 - INFO - Going to convert document batch...
2025-11-14 17:34:25,947 - INFO - Processing document 4_2025-07-07
2025-11-14 17:34:25,970 - INFO - Finished converting document 4_2025-07-07 in 0.06 sec.
2025-11-14 17:34:26,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,016 - INFO - Going to convert document batch...
2025-11-14 17:34:26,017 - INFO - Processing document 4_2025-07-31
2025-11-14 17:34:26,043 - INFO - Finished converting document 4_2025-07-31 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\4_2025-07-03' --> 'data\processed_data\SCHW\4_2025-07-03.md'
Converted 'data\edgar_documents\SCHW\4_2025-07-07' --> 'data\processed_data\SCHW\4_2025-07-07.md'
Converted 'data\edgar_documents\SCHW\4_2025-07-31' --> 'data\processed_data\SCHW\4_2025-07-31.md'


2025-11-14 17:34:26,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,112 - INFO - Going to convert document batch...
2025-11-14 17:34:26,113 - INFO - Processing document 4_2025-08-05
2025-11-14 17:34:26,140 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 17:34:26,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,192 - INFO - Going to convert document batch...
2025-11-14 17:34:26,194 - INFO - Processing document 4_2025-08-08
2025-11-14 17:34:26,225 - INFO - Finished converting document 4_2025-08-08 in 0.05 sec.
2025-11-14 17:34:26,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,298 - INFO - Going to convert document batch...
2025-11-14 17:34:26,299 - INFO - Processing document 4_2025-08-11
2025-11-14 17:34:26,326 - INFO - Finished converting document 4_2025-08-11 in 0.08 sec.
2025-11-14 17:34:26,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-08-05' --> 'data\processed_data\SCHW\4_2025-08-05.md'
Converted 'data\edgar_documents\SCHW\4_2025-08-08' --> 'data\processed_data\SCHW\4_2025-08-08.md'
Converted 'data\edgar_documents\SCHW\4_2025-08-11' --> 'data\processed_data\SCHW\4_2025-08-11.md'


2025-11-14 17:34:26,370 - INFO - Going to convert document batch...
2025-11-14 17:34:26,371 - INFO - Processing document 4_2025-08-27
2025-11-14 17:34:26,391 - INFO - Finished converting document 4_2025-08-27 in 0.05 sec.
2025-11-14 17:34:26,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,438 - INFO - Going to convert document batch...
2025-11-14 17:34:26,439 - INFO - Processing document 4_2025-08-28
2025-11-14 17:34:26,463 - INFO - Finished converting document 4_2025-08-28 in 0.06 sec.
2025-11-14 17:34:26,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,524 - INFO - Going to convert document batch...
2025-11-14 17:34:26,524 - INFO - Processing document 4_2025-08-29
2025-11-14 17:34:26,550 - INFO - Finished converting document 4_2025-08-29 in 0.06 sec.
2025-11-14 17:34:26,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,596 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2025-08-27' --> 'data\processed_data\SCHW\4_2025-08-27.md'
Converted 'data\edgar_documents\SCHW\4_2025-08-28' --> 'data\processed_data\SCHW\4_2025-08-28.md'
Converted 'data\edgar_documents\SCHW\4_2025-08-29' --> 'data\processed_data\SCHW\4_2025-08-29.md'


2025-11-14 17:34:26,597 - INFO - Processing document 4_2025-09-03
2025-11-14 17:34:26,619 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:34:26,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,666 - INFO - Going to convert document batch...
2025-11-14 17:34:26,667 - INFO - Processing document 4_2025-09-05
2025-11-14 17:34:26,693 - INFO - Finished converting document 4_2025-09-05 in 0.05 sec.
2025-11-14 17:34:26,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,747 - INFO - Going to convert document batch...
2025-11-14 17:34:26,747 - INFO - Processing document 4_2025-09-26
2025-11-14 17:34:26,773 - INFO - Finished converting document 4_2025-09-26 in 0.05 sec.
2025-11-14 17:34:26,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\4_2025-09-03' --> 'data\processed_data\SCHW\4_2025-09-03.md'
Converted 'data\edgar_documents\SCHW\4_2025-09-05' --> 'data\processed_data\SCHW\4_2025-09-05.md'
Converted 'data\edgar_documents\SCHW\4_2025-09-26' --> 'data\processed_data\SCHW\4_2025-09-26.md'


2025-11-14 17:34:26,836 - INFO - Going to convert document batch...
2025-11-14 17:34:26,837 - INFO - Processing document 4_2025-10-02
2025-11-14 17:34:26,860 - INFO - Finished converting document 4_2025-10-02 in 0.06 sec.
2025-11-14 17:34:26,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:26,928 - INFO - Going to convert document batch...
2025-11-14 17:34:26,929 - INFO - Processing document 4_2025-10-03
2025-11-14 17:34:26,957 - INFO - Finished converting document 4_2025-10-03 in 0.06 sec.
2025-11-14 17:34:26,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,007 - INFO - Going to convert document batch...
2025-11-14 17:34:27,008 - INFO - Processing document 4_2025-10-24
2025-11-14 17:34:27,036 - INFO - Finished converting document 4_2025-10-24 in 0.05 sec.
2025-11-14 17:34:27,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,081 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\4_2025-10-02' --> 'data\processed_data\SCHW\4_2025-10-02.md'
Converted 'data\edgar_documents\SCHW\4_2025-10-03' --> 'data\processed_data\SCHW\4_2025-10-03.md'
Converted 'data\edgar_documents\SCHW\4_2025-10-24' --> 'data\processed_data\SCHW\4_2025-10-24.md'


2025-11-14 17:34:27,082 - INFO - Processing document 4_2025-10-30
2025-11-14 17:34:27,105 - INFO - Finished converting document 4_2025-10-30 in 0.05 sec.
2025-11-14 17:34:27,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,150 - INFO - Going to convert document batch...
2025-11-14 17:34:27,151 - INFO - Processing document 4_2025-11-10
2025-11-14 17:34:27,176 - INFO - Finished converting document 4_2025-11-10 in 0.05 sec.
2025-11-14 17:34:27,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,227 - INFO - Going to convert document batch...
2025-11-14 17:34:27,228 - INFO - Processing document 8-K_2023-01-18
2025-11-14 17:34:27,248 - INFO - Finished converting document 8-K_2023-01-18 in 0.05 sec.
2025-11-14 17:34:27,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,286 - INFO - Going to convert document batch...
2025-11-14 17:34:27,286 - INFO - Processing document 8-K_2023-01-31
2025-11-14 17:34:27,30

Converted 'data\edgar_documents\SCHW\4_2025-10-30' --> 'data\processed_data\SCHW\4_2025-10-30.md'
Converted 'data\edgar_documents\SCHW\4_2025-11-10' --> 'data\processed_data\SCHW\4_2025-11-10.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-01-18' --> 'data\processed_data\SCHW\8-K_2023-01-18.md'


2025-11-14 17:34:27,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,341 - INFO - Going to convert document batch...
2025-11-14 17:34:27,342 - INFO - Processing document 8-K_2023-04-06
2025-11-14 17:34:27,358 - INFO - Finished converting document 8-K_2023-04-06 in 0.05 sec.
2025-11-14 17:34:27,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,412 - INFO - Going to convert document batch...
2025-11-14 17:34:27,413 - INFO - Processing document 8-K_2023-04-17
2025-11-14 17:34:27,435 - INFO - Finished converting document 8-K_2023-04-17 in 0.06 sec.
2025-11-14 17:34:27,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,503 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SCHW\8-K_2023-01-31' --> 'data\processed_data\SCHW\8-K_2023-01-31.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-04-06' --> 'data\processed_data\SCHW\8-K_2023-04-06.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-04-17' --> 'data\processed_data\SCHW\8-K_2023-04-17.md'


2025-11-14 17:34:27,504 - INFO - Processing document 8-K_2023-05-05
2025-11-14 17:34:27,528 - INFO - Finished converting document 8-K_2023-05-05 in 0.08 sec.
2025-11-14 17:34:27,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,578 - INFO - Going to convert document batch...
2025-11-14 17:34:27,579 - INFO - Processing document 8-K_2023-05-19
2025-11-14 17:34:27,604 - INFO - Finished converting document 8-K_2023-05-19 in 0.06 sec.
2025-11-14 17:34:27,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,665 - INFO - Going to convert document batch...
2025-11-14 17:34:27,666 - INFO - Processing document 8-K_2023-05-22
2025-11-14 17:34:27,707 - INFO - Finished converting document 8-K_2023-05-22 in 0.08 sec.
2025-11-14 17:34:27,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SCHW\8-K_2023-05-05' --> 'data\processed_data\SCHW\8-K_2023-05-05.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-05-19' --> 'data\processed_data\SCHW\8-K_2023-05-19.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-05-22' --> 'data\processed_data\SCHW\8-K_2023-05-22.md'


2025-11-14 17:34:27,755 - INFO - Going to convert document batch...
2025-11-14 17:34:27,755 - INFO - Processing document 8-K_2023-07-18
2025-11-14 17:34:27,775 - INFO - Finished converting document 8-K_2023-07-18 in 0.05 sec.
2025-11-14 17:34:27,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,813 - INFO - Going to convert document batch...
2025-11-14 17:34:27,814 - INFO - Processing document 8-K_2023-08-21
2025-11-14 17:34:27,829 - INFO - Finished converting document 8-K_2023-08-21 in 0.05 sec.
2025-11-14 17:34:27,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:27,863 - INFO - Going to convert document batch...
2025-11-14 17:34:27,864 - INFO - Processing document 8-K_2023-08-24
2025-11-14 17:34:28,108 - INFO - Finished converting document 8-K_2023-08-24 in 0.26 sec.


Converted 'data\edgar_documents\SCHW\8-K_2023-07-18' --> 'data\processed_data\SCHW\8-K_2023-07-18.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-08-21' --> 'data\processed_data\SCHW\8-K_2023-08-21.md'


2025-11-14 17:34:28,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,145 - INFO - Going to convert document batch...
2025-11-14 17:34:28,147 - INFO - Processing document 8-K_2023-10-16
2025-11-14 17:34:28,164 - INFO - Finished converting document 8-K_2023-10-16 in 0.03 sec.
2025-11-14 17:34:28,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,237 - INFO - Going to convert document batch...
2025-11-14 17:34:28,238 - INFO - Processing document 8-K_2023-11-17
2025-11-14 17:34:28,263 - INFO - Finished converting document 8-K_2023-11-17 in 0.09 sec.
2025-11-14 17:34:28,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,300 - INFO - Going to convert document batch...
2025-11-14 17:34:28,302 - INFO - Processing document 8-K_2024-01-17
2025-11-14 17:34:28,318 - INFO - Finished converting document 8-K_2024-01-17 in 0.05 sec.


Converted 'data\edgar_documents\SCHW\8-K_2023-08-24' --> 'data\processed_data\SCHW\8-K_2023-08-24.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-10-16' --> 'data\processed_data\SCHW\8-K_2023-10-16.md'
Converted 'data\edgar_documents\SCHW\8-K_2023-11-17' --> 'data\processed_data\SCHW\8-K_2023-11-17.md'


2025-11-14 17:34:28,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,354 - INFO - Going to convert document batch...
2025-11-14 17:34:28,355 - INFO - Processing document 8-K_2024-04-15
2025-11-14 17:34:28,372 - INFO - Finished converting document 8-K_2024-04-15 in 0.05 sec.
2025-11-14 17:34:28,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,410 - INFO - Going to convert document batch...
2025-11-14 17:34:28,411 - INFO - Processing document 8-K_2024-05-16
2025-11-14 17:34:28,430 - INFO - Finished converting document 8-K_2024-05-16 in 0.05 sec.
2025-11-14 17:34:28,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,471 - INFO - Going to convert document batch...
2025-11-14 17:34:28,472 - INFO - Processing document 8-K_2024-05-29
2025-11-14 17:34:28,499 - INFO - Finished converting document 8-K_2024-05-29 in 0.06 sec.


Converted 'data\edgar_documents\SCHW\8-K_2024-01-17' --> 'data\processed_data\SCHW\8-K_2024-01-17.md'
Converted 'data\edgar_documents\SCHW\8-K_2024-04-15' --> 'data\processed_data\SCHW\8-K_2024-04-15.md'
Converted 'data\edgar_documents\SCHW\8-K_2024-05-16' --> 'data\processed_data\SCHW\8-K_2024-05-16.md'
Converted 'data\edgar_documents\SCHW\8-K_2024-05-29' --> 'data\processed_data\SCHW\8-K_2024-05-29.md'


2025-11-14 17:34:28,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,558 - INFO - Going to convert document batch...
2025-11-14 17:34:28,558 - INFO - Processing document 8-K_2024-07-16
2025-11-14 17:34:28,578 - INFO - Finished converting document 8-K_2024-07-16 in 0.06 sec.
2025-11-14 17:34:28,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,612 - INFO - Going to convert document batch...
2025-11-14 17:34:28,613 - INFO - Processing document 8-K_2024-07-25
2025-11-14 17:34:28,628 - INFO - Finished converting document 8-K_2024-07-25 in 0.03 sec.
2025-11-14 17:34:28,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,685 - INFO - Going to convert document batch...
2025-11-14 17:34:28,686 - INFO - Processing document 8-K_2024-10-01
2025-11-14 17:34:28,703 - INFO - Finished converting document 8-K_2024-10-01 in 0.06 sec.
2025-11-14 17:34:28,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SCHW\8-K_2024-07-16' --> 'data\processed_data\SCHW\8-K_2024-07-16.md'
Converted 'data\edgar_documents\SCHW\8-K_2024-07-25' --> 'data\processed_data\SCHW\8-K_2024-07-25.md'
Converted 'data\edgar_documents\SCHW\8-K_2024-10-01' --> 'data\processed_data\SCHW\8-K_2024-10-01.md'


2025-11-14 17:34:28,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,809 - INFO - Going to convert document batch...
2025-11-14 17:34:28,810 - INFO - Processing document 8-K_2025-01-21
2025-11-14 17:34:28,829 - INFO - Finished converting document 8-K_2025-01-21 in 0.05 sec.
2025-11-14 17:34:28,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:28,884 - INFO - Going to convert document batch...
2025-11-14 17:34:28,884 - INFO - Processing document 8-K_2025-02-10
2025-11-14 17:34:28,938 - INFO - Finished converting document 8-K_2025-02-10 in 0.09 sec.


Converted 'data\edgar_documents\SCHW\8-K_2024-10-15' --> 'data\processed_data\SCHW\8-K_2024-10-15.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-01-21' --> 'data\processed_data\SCHW\8-K_2025-01-21.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-02-10' --> 'data\processed_data\SCHW\8-K_2025-02-10.md'


2025-11-14 17:34:28,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,015 - INFO - Going to convert document batch...
2025-11-14 17:34:29,015 - INFO - Processing document 8-K_2025-02-12
2025-11-14 17:34:29,038 - INFO - Finished converting document 8-K_2025-02-12 in 0.06 sec.
2025-11-14 17:34:29,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,074 - INFO - Going to convert document batch...
2025-11-14 17:34:29,075 - INFO - Processing document 8-K_2025-04-01
2025-11-14 17:34:29,091 - INFO - Finished converting document 8-K_2025-04-01 in 0.05 sec.
2025-11-14 17:34:29,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,124 - INFO - Going to convert document batch...
2025-11-14 17:34:29,126 - INFO - Processing document 8-K_2025-04-17
2025-11-14 17:34:29,146 - INFO - Finished converting document 8-K_2025-04-17 in 0.05 sec.
2025-11-14 17:34:29,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SCHW\8-K_2025-02-12' --> 'data\processed_data\SCHW\8-K_2025-02-12.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-04-01' --> 'data\processed_data\SCHW\8-K_2025-04-01.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-04-17' --> 'data\processed_data\SCHW\8-K_2025-04-17.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-05-23' --> 'data\processed_data\SCHW\8-K_2025-05-23.md'


2025-11-14 17:34:29,250 - INFO - Going to convert document batch...
2025-11-14 17:34:29,251 - INFO - Processing document 8-K_2025-06-02
2025-11-14 17:34:29,269 - INFO - Finished converting document 8-K_2025-06-02 in 0.05 sec.
2025-11-14 17:34:29,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,302 - INFO - Going to convert document batch...
2025-11-14 17:34:29,302 - INFO - Processing document 8-K_2025-07-18
2025-11-14 17:34:29,320 - INFO - Finished converting document 8-K_2025-07-18 in 0.03 sec.
2025-11-14 17:34:29,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,373 - INFO - Going to convert document batch...
2025-11-14 17:34:29,374 - INFO - Processing document 8-K_2025-10-16
2025-11-14 17:34:29,391 - INFO - Finished converting document 8-K_2025-10-16 in 0.06 sec.
2025-11-14 17:34:29,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:29,425 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SCHW\8-K_2025-06-02' --> 'data\processed_data\SCHW\8-K_2025-06-02.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-07-18' --> 'data\processed_data\SCHW\8-K_2025-07-18.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-10-16' --> 'data\processed_data\SCHW\8-K_2025-10-16.md'
Converted 'data\edgar_documents\SCHW\8-K_2025-11-06' --> 'data\processed_data\SCHW\8-K_2025-11-06.md'


2025-11-14 17:34:29,482 - ERROR - Input document DEF-14A_2023-03-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:34:29,483 - INFO - Going to convert document batch...
2025-11-14 17:34:29,517 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:34:29,517 - ERROR - Input document DEF-14A_2024-04-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\SCHW\DEF-14A_2023-03-31: File format not allowed: data\edgar_documents\SCHW\DEF-14A_2023-03-31
Error processing data\edgar_documents\SCHW\DEF-14A_2024-04-05: File format not allowed: data\edgar_documents\SCHW\DEF-14A_2024-04-05
Error processing data\edgar_documents\SCHW\DEF-14A_2025-04-04: File format not allowed: data\edgar_documents\SCHW\DEF-14A_2025-04-04
Processed 194 new files. Errors: 10
Found 162 files to process in data\edgar_documents\SO


2025-11-14 17:34:30,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:34,139 - INFO - Going to convert document batch...
2025-11-14 17:34:34,141 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:34:34,143 - INFO - Processing document 10-K_2023-02-16
2025-11-14 17:34:44,663 - INFO - Finished converting document 10-K_2023-02-16 in 15.09 sec.


Converted 'data\edgar_documents\SO\10-K_2023-02-16' --> 'data\processed_data\SO\10-K_2023-02-16.md'


2025-11-14 17:34:47,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:34:52,361 - INFO - Going to convert document batch...
2025-11-14 17:34:52,361 - INFO - Processing document 10-K_2024-02-15
2025-11-14 17:35:02,493 - INFO - Finished converting document 10-K_2024-02-15 in 15.09 sec.


Converted 'data\edgar_documents\SO\10-K_2024-02-15' --> 'data\processed_data\SO\10-K_2024-02-15.md'


2025-11-14 17:35:05,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:35:11,149 - INFO - Going to convert document batch...
2025-11-14 17:35:11,149 - INFO - Processing document 10-K_2025-02-20
2025-11-14 17:35:21,706 - INFO - Finished converting document 10-K_2025-02-20 in 16.45 sec.
2025-11-14 17:35:24,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-K_2025-02-20' --> 'data\processed_data\SO\10-K_2025-02-20.md'


2025-11-14 17:35:25,990 - INFO - Going to convert document batch...
2025-11-14 17:35:25,992 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:35:28,801 - INFO - Finished converting document 10-Q_2023-04-27 in 4.39 sec.
2025-11-14 17:35:30,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2023-04-27' --> 'data\processed_data\SO\10-Q_2023-04-27.md'


2025-11-14 17:35:33,945 - INFO - Going to convert document batch...
2025-11-14 17:35:33,946 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 17:35:37,374 - INFO - Finished converting document 10-Q_2023-08-03 in 7.11 sec.
2025-11-14 17:35:39,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2023-08-03' --> 'data\processed_data\SO\10-Q_2023-08-03.md'


2025-11-14 17:35:41,545 - INFO - Going to convert document batch...
2025-11-14 17:35:41,547 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 17:35:45,642 - INFO - Finished converting document 10-Q_2023-11-02 in 6.75 sec.
2025-11-14 17:35:47,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2023-11-02' --> 'data\processed_data\SO\10-Q_2023-11-02.md'


2025-11-14 17:35:48,626 - INFO - Going to convert document batch...
2025-11-14 17:35:48,627 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 17:35:52,447 - INFO - Finished converting document 10-Q_2024-05-02 in 5.20 sec.
2025-11-14 17:35:54,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2024-05-02' --> 'data\processed_data\SO\10-Q_2024-05-02.md'


2025-11-14 17:35:56,493 - INFO - Going to convert document batch...
2025-11-14 17:35:56,494 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 17:35:59,847 - INFO - Finished converting document 10-Q_2024-08-01 in 5.99 sec.
2025-11-14 17:36:01,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2024-08-01' --> 'data\processed_data\SO\10-Q_2024-08-01.md'


2025-11-14 17:36:04,473 - INFO - Going to convert document batch...
2025-11-14 17:36:04,474 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 17:36:07,995 - INFO - Finished converting document 10-Q_2024-10-31 in 6.61 sec.
2025-11-14 17:36:09,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2024-10-31' --> 'data\processed_data\SO\10-Q_2024-10-31.md'


2025-11-14 17:36:11,968 - INFO - Going to convert document batch...
2025-11-14 17:36:11,968 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 17:36:14,778 - INFO - Finished converting document 10-Q_2025-05-01 in 5.20 sec.
2025-11-14 17:36:17,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2025-05-01' --> 'data\processed_data\SO\10-Q_2025-05-01.md'


2025-11-14 17:36:19,180 - INFO - Going to convert document batch...
2025-11-14 17:36:19,181 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 17:36:22,596 - INFO - Finished converting document 10-Q_2025-07-31 in 5.62 sec.
2025-11-14 17:36:24,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2025-07-31' --> 'data\processed_data\SO\10-Q_2025-07-31.md'


2025-11-14 17:36:27,271 - INFO - Going to convert document batch...
2025-11-14 17:36:27,273 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 17:36:30,850 - INFO - Finished converting document 10-Q_2025-10-30 in 6.72 sec.
2025-11-14 17:36:32,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,537 - INFO - Going to convert document batch...
2025-11-14 17:36:32,537 - INFO - Processing document 4_2023-01-03
2025-11-14 17:36:32,559 - INFO - Finished converting document 4_2023-01-03 in 0.06 sec.
2025-11-14 17:36:32,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,616 - INFO - Going to convert document batch...
2025-11-14 17:36:32,616 - INFO - Processing document 4_2023-01-05
2025-11-14 17:36:32,634 - INFO - Finished converting document 4_2023-01-05 in 0.03 sec.
2025-11-14 17:36:32,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\10-Q_2025-10-30' --> 'data\processed_data\SO\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\SO\4_2023-01-03' --> 'data\processed_data\SO\4_2023-01-03.md'
Converted 'data\edgar_documents\SO\4_2023-01-05' --> 'data\processed_data\SO\4_2023-01-05.md'


2025-11-14 17:36:32,692 - INFO - Going to convert document batch...
2025-11-14 17:36:32,692 - INFO - Processing document 4_2023-01-11
2025-11-14 17:36:32,714 - INFO - Finished converting document 4_2023-01-11 in 0.06 sec.
2025-11-14 17:36:32,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,761 - INFO - Going to convert document batch...
2025-11-14 17:36:32,762 - INFO - Processing document 4_2023-02-07
2025-11-14 17:36:32,785 - INFO - Finished converting document 4_2023-02-07 in 0.05 sec.
2025-11-14 17:36:32,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,847 - INFO - Going to convert document batch...
2025-11-14 17:36:32,848 - INFO - Processing document 4_2023-02-09
2025-11-14 17:36:32,866 - INFO - Finished converting document 4_2023-02-09 in 0.06 sec.
2025-11-14 17:36:32,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,906 - INFO - Going to convert document batch...
2025-11-14 17:36:32,906 - 

Converted 'data\edgar_documents\SO\4_2023-01-11' --> 'data\processed_data\SO\4_2023-01-11.md'
Converted 'data\edgar_documents\SO\4_2023-02-07' --> 'data\processed_data\SO\4_2023-02-07.md'
Converted 'data\edgar_documents\SO\4_2023-02-09' --> 'data\processed_data\SO\4_2023-02-09.md'


2025-11-14 17:36:32,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:32,974 - INFO - Going to convert document batch...
2025-11-14 17:36:32,975 - INFO - Processing document 4_2023-02-15
2025-11-14 17:36:33,003 - INFO - Finished converting document 4_2023-02-15 in 0.05 sec.
2025-11-14 17:36:33,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,079 - INFO - Going to convert document batch...
2025-11-14 17:36:33,080 - INFO - Processing document 4_2023-02-17
2025-11-14 17:36:33,108 - INFO - Finished converting document 4_2023-02-17 in 0.08 sec.
2025-11-14 17:36:33,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\4_2023-02-14' --> 'data\processed_data\SO\4_2023-02-14.md'
Converted 'data\edgar_documents\SO\4_2023-02-15' --> 'data\processed_data\SO\4_2023-02-15.md'
Converted 'data\edgar_documents\SO\4_2023-02-17' --> 'data\processed_data\SO\4_2023-02-17.md'


2025-11-14 17:36:33,148 - INFO - Going to convert document batch...
2025-11-14 17:36:33,149 - INFO - Processing document 4_2023-03-02
2025-11-14 17:36:33,166 - INFO - Finished converting document 4_2023-03-02 in 0.03 sec.
2025-11-14 17:36:33,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,211 - INFO - Going to convert document batch...
2025-11-14 17:36:33,211 - INFO - Processing document 4_2023-04-03
2025-11-14 17:36:33,231 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 17:36:33,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,297 - INFO - Going to convert document batch...
2025-11-14 17:36:33,299 - INFO - Processing document 4_2023-04-11
2025-11-14 17:36:33,316 - INFO - Finished converting document 4_2023-04-11 in 0.06 sec.
2025-11-14 17:36:33,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,360 - INFO - Going to convert document batch...
2025-11-14 17:36:33,361 - 

Converted 'data\edgar_documents\SO\4_2023-03-02' --> 'data\processed_data\SO\4_2023-03-02.md'
Converted 'data\edgar_documents\SO\4_2023-04-03' --> 'data\processed_data\SO\4_2023-04-03.md'
Converted 'data\edgar_documents\SO\4_2023-04-11' --> 'data\processed_data\SO\4_2023-04-11.md'


2025-11-14 17:36:33,384 - INFO - Finished converting document 4_2023-05-09 in 0.03 sec.
2025-11-14 17:36:33,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,432 - INFO - Going to convert document batch...
2025-11-14 17:36:33,433 - INFO - Processing document 4_2023-05-11
2025-11-14 17:36:33,457 - INFO - Finished converting document 4_2023-05-11 in 0.05 sec.
2025-11-14 17:36:33,499 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:33,500 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_g

Converted 'data\edgar_documents\SO\4_2023-05-09' --> 'data\processed_data\SO\4_2023-05-09.md'
Converted 'data\edgar_documents\SO\4_2023-05-11' --> 'data\processed_data\SO\4_2023-05-11.md'
Error processing data\edgar_documents\SO\4_2023-05-15: File format not allowed: data\edgar_documents\SO\4_2023-05-15
Error processing data\edgar_documents\SO\4_2023-05-16: File format not allowed: data\edgar_documents\SO\4_2023-05-16


2025-11-14 17:36:33,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,613 - INFO - Going to convert document batch...
2025-11-14 17:36:33,613 - INFO - Processing document 4_2023-06-06
2025-11-14 17:36:33,637 - INFO - Finished converting document 4_2023-06-06 in 0.05 sec.
2025-11-14 17:36:33,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,700 - INFO - Going to convert document batch...
2025-11-14 17:36:33,701 - INFO - Processing document 4_2023-06-12
2025-11-14 17:36:33,723 - INFO - Finished converting document 4_2023-06-12 in 0.05 sec.
2025-11-14 17:36:33,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,766 - INFO - Going to convert document batch...
2025-11-14 17:36:33,767 - INFO - Processing document 4_2023-06-13
2025-11-14 17:36:33,787 - INFO - Finished converting document 4_2023-06-13 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2023-06-02' --> 'data\processed_data\SO\4_2023-06-02.md'
Converted 'data\edgar_documents\SO\4_2023-06-06' --> 'data\processed_data\SO\4_2023-06-06.md'
Converted 'data\edgar_documents\SO\4_2023-06-12' --> 'data\processed_data\SO\4_2023-06-12.md'


2025-11-14 17:36:33,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,844 - INFO - Going to convert document batch...
2025-11-14 17:36:33,846 - INFO - Processing document 4_2023-07-03
2025-11-14 17:36:33,877 - INFO - Finished converting document 4_2023-07-03 in 0.06 sec.
2025-11-14 17:36:33,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:33,946 - INFO - Going to convert document batch...
2025-11-14 17:36:33,947 - INFO - Processing document 4_2023-07-05
2025-11-14 17:36:33,971 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.


Converted 'data\edgar_documents\SO\4_2023-06-13' --> 'data\processed_data\SO\4_2023-06-13.md'
Converted 'data\edgar_documents\SO\4_2023-07-03' --> 'data\processed_data\SO\4_2023-07-03.md'


2025-11-14 17:36:34,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,017 - INFO - Going to convert document batch...
2025-11-14 17:36:34,017 - INFO - Processing document 4_2023-07-11
2025-11-14 17:36:34,038 - INFO - Finished converting document 4_2023-07-11 in 0.03 sec.
2025-11-14 17:36:34,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,084 - INFO - Going to convert document batch...
2025-11-14 17:36:34,084 - INFO - Processing document 4_2023-07-24
2025-11-14 17:36:34,104 - INFO - Finished converting document 4_2023-07-24 in 0.05 sec.
2025-11-14 17:36:34,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,143 - INFO - Going to convert document batch...
2025-11-14 17:36:34,144 - INFO - Processing document 4_2023-08-11
2025-11-14 17:36:34,161 - INFO - Finished converting document 4_2023-08-11 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2023-07-05' --> 'data\processed_data\SO\4_2023-07-05.md'
Converted 'data\edgar_documents\SO\4_2023-07-11' --> 'data\processed_data\SO\4_2023-07-11.md'
Converted 'data\edgar_documents\SO\4_2023-07-24' --> 'data\processed_data\SO\4_2023-07-24.md'
Converted 'data\edgar_documents\SO\4_2023-08-11' --> 'data\processed_data\SO\4_2023-08-11.md'


2025-11-14 17:36:34,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,218 - INFO - Going to convert document batch...
2025-11-14 17:36:34,219 - INFO - Processing document 4_2023-08-31
2025-11-14 17:36:34,241 - INFO - Finished converting document 4_2023-08-31 in 0.06 sec.
2025-11-14 17:36:34,280 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:34,281 - ERROR - Input document 4_2023-09-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:36

Converted 'data\edgar_documents\SO\4_2023-08-31' --> 'data\processed_data\SO\4_2023-08-31.md'
Error processing data\edgar_documents\SO\4_2023-09-05: File format not allowed: data\edgar_documents\SO\4_2023-09-05
Error processing data\edgar_documents\SO\4_2023-09-06: File format not allowed: data\edgar_documents\SO\4_2023-09-06
Converted 'data\edgar_documents\SO\4_2023-09-12' --> 'data\processed_data\SO\4_2023-09-12.md'
Converted 'data\edgar_documents\SO\4_2023-10-02' --> 'data\processed_data\SO\4_2023-10-02.md'


2025-11-14 17:36:34,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,502 - INFO - Going to convert document batch...
2025-11-14 17:36:34,503 - INFO - Processing document 4_2023-11-13
2025-11-14 17:36:34,530 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 17:36:34,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,592 - INFO - Going to convert document batch...
2025-11-14 17:36:34,592 - INFO - Processing document 4_2023-11-17
2025-11-14 17:36:34,615 - INFO - Finished converting document 4_2023-11-17 in 0.05 sec.
2025-11-14 17:36:34,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,660 - INFO - Going to convert document batch...
2025-11-14 17:36:34,661 - INFO - Processing document 4_2023-12-12
2025-11-14 17:36:34,679 - INFO - Finished converting document 4_2023-12-12 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2023-10-11' --> 'data\processed_data\SO\4_2023-10-11.md'
Converted 'data\edgar_documents\SO\4_2023-11-13' --> 'data\processed_data\SO\4_2023-11-13.md'
Converted 'data\edgar_documents\SO\4_2023-11-17' --> 'data\processed_data\SO\4_2023-11-17.md'


2025-11-14 17:36:34,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,720 - INFO - Going to convert document batch...
2025-11-14 17:36:34,721 - INFO - Processing document 4_2024-01-02
2025-11-14 17:36:34,741 - INFO - Finished converting document 4_2024-01-02 in 0.03 sec.
2025-11-14 17:36:34,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,785 - INFO - Going to convert document batch...
2025-11-14 17:36:34,785 - INFO - Processing document 4_2024-01-10
2025-11-14 17:36:34,804 - INFO - Finished converting document 4_2024-01-10 in 0.03 sec.
2025-11-14 17:36:34,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,850 - INFO - Going to convert document batch...
2025-11-14 17:36:34,850 - INFO - Processing document 4_2024-01-18
2025-11-14 17:36:34,872 - INFO - Finished converting document 4_2024-01-18 in 0.05 sec.


Converted 'data\edgar_documents\SO\4_2023-12-12' --> 'data\processed_data\SO\4_2023-12-12.md'
Converted 'data\edgar_documents\SO\4_2024-01-02' --> 'data\processed_data\SO\4_2024-01-02.md'
Converted 'data\edgar_documents\SO\4_2024-01-10' --> 'data\processed_data\SO\4_2024-01-10.md'


2025-11-14 17:36:34,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,915 - INFO - Going to convert document batch...
2025-11-14 17:36:34,917 - INFO - Processing document 4_2024-02-02
2025-11-14 17:36:34,944 - INFO - Finished converting document 4_2024-02-02 in 0.05 sec.
2025-11-14 17:36:34,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:34,993 - INFO - Going to convert document batch...
2025-11-14 17:36:34,993 - INFO - Processing document 4_2024-02-06
2025-11-14 17:36:35,020 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 17:36:35,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,063 - INFO - Going to convert document batch...
2025-11-14 17:36:35,063 - INFO - Processing document 4_2024-02-07
2025-11-14 17:36:35,082 - INFO - Finished converting document 4_2024-02-07 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2024-01-18' --> 'data\processed_data\SO\4_2024-01-18.md'
Converted 'data\edgar_documents\SO\4_2024-02-02' --> 'data\processed_data\SO\4_2024-02-02.md'
Converted 'data\edgar_documents\SO\4_2024-02-06' --> 'data\processed_data\SO\4_2024-02-06.md'


2025-11-14 17:36:35,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,123 - INFO - Going to convert document batch...
2025-11-14 17:36:35,124 - INFO - Processing document 4_2024-02-08
2025-11-14 17:36:35,148 - INFO - Finished converting document 4_2024-02-08 in 0.05 sec.
2025-11-14 17:36:35,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,198 - INFO - Going to convert document batch...
2025-11-14 17:36:35,198 - INFO - Processing document 4_2024-02-09
2025-11-14 17:36:35,224 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.
2025-11-14 17:36:35,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,268 - INFO - Going to convert document batch...
2025-11-14 17:36:35,269 - INFO - Processing document 4_2024-02-13
2025-11-14 17:36:35,286 - INFO - Finished converting document 4_2024-02-13 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2024-02-07' --> 'data\processed_data\SO\4_2024-02-07.md'
Converted 'data\edgar_documents\SO\4_2024-02-08' --> 'data\processed_data\SO\4_2024-02-08.md'
Converted 'data\edgar_documents\SO\4_2024-02-09' --> 'data\processed_data\SO\4_2024-02-09.md'


2025-11-14 17:36:35,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,325 - INFO - Going to convert document batch...
2025-11-14 17:36:35,326 - INFO - Processing document 4_2024-02-14
2025-11-14 17:36:35,350 - INFO - Finished converting document 4_2024-02-14 in 0.05 sec.
2025-11-14 17:36:35,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,397 - INFO - Going to convert document batch...
2025-11-14 17:36:35,398 - INFO - Processing document 4_2024-02-16
2025-11-14 17:36:35,418 - INFO - Finished converting document 4_2024-02-16 in 0.05 sec.
2025-11-14 17:36:35,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,456 - INFO - Going to convert document batch...
2025-11-14 17:36:35,457 - INFO - Processing document 4_2024-02-20
2025-11-14 17:36:35,474 - INFO - Finished converting document 4_2024-02-20 in 0.03 sec.


Converted 'data\edgar_documents\SO\4_2024-02-13' --> 'data\processed_data\SO\4_2024-02-13.md'
Converted 'data\edgar_documents\SO\4_2024-02-14' --> 'data\processed_data\SO\4_2024-02-14.md'
Converted 'data\edgar_documents\SO\4_2024-02-16' --> 'data\processed_data\SO\4_2024-02-16.md'


2025-11-14 17:36:35,509 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:35,510 - ERROR - Input document 4_2024-02-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:36:35,511 - INFO - Going to convert document batch...
2025-11-14 17:36:35,529 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:35,529 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\SO\4_2024-02-20' --> 'data\processed_data\SO\4_2024-02-20.md'
Error processing data\edgar_documents\SO\4_2024-02-26: File format not allowed: data\edgar_documents\SO\4_2024-02-26
Error processing data\edgar_documents\SO\4_2024-02-27: File format not allowed: data\edgar_documents\SO\4_2024-02-27
Converted 'data\edgar_documents\SO\4_2024-03-12' --> 'data\processed_data\SO\4_2024-03-12.md'
Converted 'data\edgar_documents\SO\4_2024-03-15' --> 'data\processed_data\SO\4_2024-03-15.md'


2025-11-14 17:36:35,689 - INFO - Processing document 4_2024-04-05
2025-11-14 17:36:35,709 - INFO - Finished converting document 4_2024-04-05 in 0.03 sec.
2025-11-14 17:36:35,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:35,772 - INFO - Going to convert document batch...
2025-11-14 17:36:35,773 - INFO - Processing document 4_2024-05-02
2025-11-14 17:36:35,800 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 17:36:35,834 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:35,835 - ERROR - Input document 4_2024-05-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\SO\4_2024-04-05' --> 'data\processed_data\SO\4_2024-04-05.md'
Converted 'data\edgar_documents\SO\4_2024-05-02' --> 'data\processed_data\SO\4_2024-05-02.md'
Error processing data\edgar_documents\SO\4_2024-05-03: File format not allowed: data\edgar_documents\SO\4_2024-05-03


2025-11-14 17:36:36,871 - INFO - Finished converting document 4_2024-05-22 in 1.05 sec.
2025-11-14 17:36:36,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:36,913 - INFO - Going to convert document batch...
2025-11-14 17:36:36,915 - INFO - Processing document 4_2024-07-03
2025-11-14 17:36:36,935 - INFO - Finished converting document 4_2024-07-03 in 0.05 sec.
2025-11-14 17:36:36,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:36,981 - INFO - Going to convert document batch...
2025-11-14 17:36:36,982 - INFO - Processing document 4_2024-07-08
2025-11-14 17:36:37,002 - INFO - Finished converting document 4_2024-07-08 in 0.05 sec.
2025-11-14 17:36:37,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,044 - INFO - Going to convert document batch...
2025-11-14 17:36:37,044 - INFO - Processing document 4_2024-08-06
2025-11-14 17:36:37,066 - INFO - Finished converting document 4_2024-08-06 in 0.05 sec.


Converted 'data\edgar_documents\SO\4_2024-05-22' --> 'data\processed_data\SO\4_2024-05-22.md'
Converted 'data\edgar_documents\SO\4_2024-07-03' --> 'data\processed_data\SO\4_2024-07-03.md'
Converted 'data\edgar_documents\SO\4_2024-07-08' --> 'data\processed_data\SO\4_2024-07-08.md'


2025-11-14 17:36:37,113 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:37,114 - ERROR - Input document 4_2024-09-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:36:37,117 - INFO - Going to convert document batch...
2025-11-14 17:36:37,152 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:37,154 - ERROR - Input document 4_2024-09-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\SO\4_2024-08-06' --> 'data\processed_data\SO\4_2024-08-06.md'
Error processing data\edgar_documents\SO\4_2024-09-04: File format not allowed: data\edgar_documents\SO\4_2024-09-04
Error processing data\edgar_documents\SO\4_2024-09-05: File format not allowed: data\edgar_documents\SO\4_2024-09-05
Converted 'data\edgar_documents\SO\4_2024-09-09' --> 'data\processed_data\SO\4_2024-09-09.md'


2025-11-14 17:36:37,283 - INFO - Processing document 4_2024-10-02
2025-11-14 17:36:37,306 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 17:36:37,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,349 - INFO - Going to convert document batch...
2025-11-14 17:36:37,350 - INFO - Processing document 4_2024-10-08
2025-11-14 17:36:37,371 - INFO - Finished converting document 4_2024-10-08 in 0.05 sec.
2025-11-14 17:36:37,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,411 - INFO - Going to convert document batch...
2025-11-14 17:36:37,412 - INFO - Processing document 4_2024-11-05
2025-11-14 17:36:37,433 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 17:36:37,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,471 - INFO - Going to convert document batch...
2025-11-14 17:36:37,472 - INFO - Processing document 4_2024-11-15
2025-11-14 17:36:37,492 - IN

Converted 'data\edgar_documents\SO\4_2024-10-02' --> 'data\processed_data\SO\4_2024-10-02.md'
Converted 'data\edgar_documents\SO\4_2024-10-08' --> 'data\processed_data\SO\4_2024-10-08.md'
Converted 'data\edgar_documents\SO\4_2024-11-05' --> 'data\processed_data\SO\4_2024-11-05.md'


2025-11-14 17:36:37,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,532 - INFO - Going to convert document batch...
2025-11-14 17:36:37,533 - INFO - Processing document 4_2024-12-06
2025-11-14 17:36:37,552 - INFO - Finished converting document 4_2024-12-06 in 0.03 sec.
2025-11-14 17:36:37,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,597 - INFO - Going to convert document batch...
2025-11-14 17:36:37,598 - INFO - Processing document 4_2025-01-06
2025-11-14 17:36:37,618 - INFO - Finished converting document 4_2025-01-06 in 0.03 sec.
2025-11-14 17:36:37,655 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:37,656 - ERROR - Input document 4_2025-01-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\SO\4_2024-11-15' --> 'data\processed_data\SO\4_2024-11-15.md'
Converted 'data\edgar_documents\SO\4_2024-12-06' --> 'data\processed_data\SO\4_2024-12-06.md'
Converted 'data\edgar_documents\SO\4_2025-01-06' --> 'data\processed_data\SO\4_2025-01-06.md'
Error processing data\edgar_documents\SO\4_2025-01-08: File format not allowed: data\edgar_documents\SO\4_2025-01-08
Error processing data\edgar_documents\SO\4_2025-01-10: File format not allowed: data\edgar_documents\SO\4_2025-01-10


2025-11-14 17:36:37,703 - INFO - Processing document 4_2025-02-04
2025-11-14 17:36:37,733 - INFO - Finished converting document 4_2025-02-04 in 0.06 sec.
2025-11-14 17:36:37,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,784 - INFO - Going to convert document batch...
2025-11-14 17:36:37,785 - INFO - Processing document 4_2025-02-05
2025-11-14 17:36:37,803 - INFO - Finished converting document 4_2025-02-05 in 0.03 sec.
2025-11-14 17:36:37,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,844 - INFO - Going to convert document batch...
2025-11-14 17:36:37,845 - INFO - Processing document 4_2025-02-07
2025-11-14 17:36:37,870 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 17:36:37,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,915 - INFO - Going to convert document batch...
2025-11-14 17:36:37,916 - INFO - Processing document 4_2025-02-10
2025-11-14 17:36:37,938 - IN

Converted 'data\edgar_documents\SO\4_2025-02-04' --> 'data\processed_data\SO\4_2025-02-04.md'
Converted 'data\edgar_documents\SO\4_2025-02-05' --> 'data\processed_data\SO\4_2025-02-05.md'
Converted 'data\edgar_documents\SO\4_2025-02-07' --> 'data\processed_data\SO\4_2025-02-07.md'


2025-11-14 17:36:37,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:37,985 - INFO - Going to convert document batch...
2025-11-14 17:36:37,986 - INFO - Processing document 4_2025-02-11
2025-11-14 17:36:38,014 - INFO - Finished converting document 4_2025-02-11 in 0.06 sec.
2025-11-14 17:36:38,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,062 - INFO - Going to convert document batch...
2025-11-14 17:36:38,063 - INFO - Processing document 4_2025-02-12
2025-11-14 17:36:38,084 - INFO - Finished converting document 4_2025-02-12 in 0.03 sec.
2025-11-14 17:36:38,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,128 - INFO - Going to convert document batch...
2025-11-14 17:36:38,129 - INFO - Processing document 4_2025-02-18


Converted 'data\edgar_documents\SO\4_2025-02-10' --> 'data\processed_data\SO\4_2025-02-10.md'
Converted 'data\edgar_documents\SO\4_2025-02-11' --> 'data\processed_data\SO\4_2025-02-11.md'
Converted 'data\edgar_documents\SO\4_2025-02-12' --> 'data\processed_data\SO\4_2025-02-12.md'


2025-11-14 17:36:38,152 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 17:36:38,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,194 - INFO - Going to convert document batch...
2025-11-14 17:36:38,195 - INFO - Processing document 4_2025-02-20
2025-11-14 17:36:38,214 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 17:36:38,253 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:38,254 - ERROR - Input document 4_2025-02-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\SO\4_2025-02-18' --> 'data\processed_data\SO\4_2025-02-18.md'
Converted 'data\edgar_documents\SO\4_2025-02-20' --> 'data\processed_data\SO\4_2025-02-20.md'
Error processing data\edgar_documents\SO\4_2025-02-25: File format not allowed: data\edgar_documents\SO\4_2025-02-25
Converted 'data\edgar_documents\SO\4_2025-02-26' --> 'data\processed_data\SO\4_2025-02-26.md'


2025-11-14 17:36:38,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,397 - INFO - Going to convert document batch...
2025-11-14 17:36:38,397 - INFO - Processing document 4_2025-03-10
2025-11-14 17:36:38,421 - INFO - Finished converting document 4_2025-03-10 in 0.05 sec.
2025-11-14 17:36:38,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,494 - INFO - Going to convert document batch...
2025-11-14 17:36:38,495 - INFO - Processing document 4_2025-03-11
2025-11-14 17:36:38,516 - INFO - Finished converting document 4_2025-03-11 in 0.06 sec.
2025-11-14 17:36:38,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,553 - INFO - Going to convert document batch...
2025-11-14 17:36:38,554 - INFO - Processing document 4_2025-04-01


Converted 'data\edgar_documents\SO\4_2025-03-04' --> 'data\processed_data\SO\4_2025-03-04.md'
Converted 'data\edgar_documents\SO\4_2025-03-10' --> 'data\processed_data\SO\4_2025-03-10.md'
Converted 'data\edgar_documents\SO\4_2025-03-11' --> 'data\processed_data\SO\4_2025-03-11.md'


2025-11-14 17:36:38,574 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 17:36:38,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,617 - INFO - Going to convert document batch...
2025-11-14 17:36:38,618 - INFO - Processing document 4_2025-04-03
2025-11-14 17:36:38,640 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:36:38,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,683 - INFO - Going to convert document batch...
2025-11-14 17:36:38,684 - INFO - Processing document 4_2025-05-27
2025-11-14 17:36:38,707 - INFO - Finished converting document 4_2025-05-27 in 0.05 sec.
2025-11-14 17:36:38,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,748 - INFO - Going to convert document batch...
2025-11-14 17:36:38,750 - INFO - Processing document 4_2025-07-02
2025-11-14 17:36:38,769 - INFO - Finished converting document 4_2025-07-02 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\SO\4_2025-04-01' --> 'data\processed_data\SO\4_2025-04-01.md'
Converted 'data\edgar_documents\SO\4_2025-04-03' --> 'data\processed_data\SO\4_2025-04-03.md'
Converted 'data\edgar_documents\SO\4_2025-05-27' --> 'data\processed_data\SO\4_2025-05-27.md'
Converted 'data\edgar_documents\SO\4_2025-07-02' --> 'data\processed_data\SO\4_2025-07-02.md'


2025-11-14 17:36:38,809 - INFO - Going to convert document batch...
2025-11-14 17:36:38,810 - INFO - Processing document 4_2025-07-22
2025-11-14 17:36:38,828 - INFO - Finished converting document 4_2025-07-22 in 0.05 sec.
2025-11-14 17:36:38,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,881 - INFO - Going to convert document batch...
2025-11-14 17:36:38,882 - INFO - Processing document 4_2025-08-12
2025-11-14 17:36:38,900 - INFO - Finished converting document 4_2025-08-12 in 0.05 sec.
2025-11-14 17:36:38,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,938 - INFO - Going to convert document batch...
2025-11-14 17:36:38,938 - INFO - Processing document 4_2025-10-01
2025-11-14 17:36:38,956 - INFO - Finished converting document 4_2025-10-01 in 0.03 sec.
2025-11-14 17:36:38,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:38,998 - INFO - Going to convert document batch...
2025-11-14 17:36:38,999 - 

Converted 'data\edgar_documents\SO\4_2025-07-22' --> 'data\processed_data\SO\4_2025-07-22.md'
Converted 'data\edgar_documents\SO\4_2025-08-12' --> 'data\processed_data\SO\4_2025-08-12.md'
Converted 'data\edgar_documents\SO\4_2025-10-01' --> 'data\processed_data\SO\4_2025-10-01.md'
Converted 'data\edgar_documents\SO\4_2025-10-02' --> 'data\processed_data\SO\4_2025-10-02.md'


2025-11-14 17:36:39,096 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:39,096 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:36:39,098 - INFO - Going to convert document batch...
2025-11-14 17:36:39,133 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:36:39,134 - ERROR - Input document 4_2025-11-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\SO\4_2025-11-03: File format not allowed: data\edgar_documents\SO\4_2025-11-03
Error processing data\edgar_documents\SO\4_2025-11-04: File format not allowed: data\edgar_documents\SO\4_2025-11-04
Converted 'data\edgar_documents\SO\4_2025-11-07' --> 'data\processed_data\SO\4_2025-11-07.md'
Converted 'data\edgar_documents\SO\8-K_2023-01-05' --> 'data\processed_data\SO\8-K_2023-01-05.md'


2025-11-14 17:36:39,302 - INFO - Going to convert document batch...
2025-11-14 17:36:39,304 - INFO - Processing document 8-K_2023-01-11
2025-11-14 17:36:39,327 - INFO - Finished converting document 8-K_2023-01-11 in 0.06 sec.
2025-11-14 17:36:39,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,382 - INFO - Going to convert document batch...
2025-11-14 17:36:39,384 - INFO - Processing document 8-K_2023-02-07
2025-11-14 17:36:39,410 - INFO - Finished converting document 8-K_2023-02-07 in 0.06 sec.
2025-11-14 17:36:39,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,451 - INFO - Going to convert document batch...
2025-11-14 17:36:39,452 - INFO - Processing document 8-K_2023-02-14
2025-11-14 17:36:39,469 - INFO - Finished converting document 8-K_2023-02-14 in 0.05 sec.
2025-11-14 17:36:39,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,521 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SO\8-K_2023-01-11' --> 'data\processed_data\SO\8-K_2023-01-11.md'
Converted 'data\edgar_documents\SO\8-K_2023-02-07' --> 'data\processed_data\SO\8-K_2023-02-07.md'
Converted 'data\edgar_documents\SO\8-K_2023-02-14' --> 'data\processed_data\SO\8-K_2023-02-14.md'


2025-11-14 17:36:39,561 - INFO - Finished converting document 8-K_2023-02-16 in 0.08 sec.
2025-11-14 17:36:39,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,609 - INFO - Going to convert document batch...
2025-11-14 17:36:39,611 - INFO - Processing document 8-K_2023-02-23
2025-11-14 17:36:39,632 - INFO - Finished converting document 8-K_2023-02-23 in 0.05 sec.
2025-11-14 17:36:39,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,692 - INFO - Going to convert document batch...
2025-11-14 17:36:39,693 - INFO - Processing document 8-K_2023-02-24
2025-11-14 17:36:39,713 - INFO - Finished converting document 8-K_2023-02-24 in 0.06 sec.
2025-11-14 17:36:39,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,755 - INFO - Going to convert document batch...
2025-11-14 17:36:39,755 - INFO - Processing document 8-K_2023-03-01
2025-11-14 17:36:39,778 - INFO - Finished converting document 8-K_2023-03-01 in 0.

Converted 'data\edgar_documents\SO\8-K_2023-02-16' --> 'data\processed_data\SO\8-K_2023-02-16.md'
Converted 'data\edgar_documents\SO\8-K_2023-02-23' --> 'data\processed_data\SO\8-K_2023-02-23.md'
Converted 'data\edgar_documents\SO\8-K_2023-02-24' --> 'data\processed_data\SO\8-K_2023-02-24.md'


2025-11-14 17:36:39,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,830 - INFO - Going to convert document batch...
2025-11-14 17:36:39,831 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:36:39,869 - INFO - Finished converting document 8-K_2023-04-27 in 0.06 sec.
2025-11-14 17:36:39,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:39,925 - INFO - Going to convert document batch...
2025-11-14 17:36:39,926 - INFO - Processing document 8-K_2023-05-18
2025-11-14 17:36:39,956 - INFO - Finished converting document 8-K_2023-05-18 in 0.06 sec.
2025-11-14 17:36:39,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\8-K_2023-03-01' --> 'data\processed_data\SO\8-K_2023-03-01.md'
Converted 'data\edgar_documents\SO\8-K_2023-04-27' --> 'data\processed_data\SO\8-K_2023-04-27.md'
Converted 'data\edgar_documents\SO\8-K_2023-05-18' --> 'data\processed_data\SO\8-K_2023-05-18.md'


2025-11-14 17:36:40,021 - INFO - Going to convert document batch...
2025-11-14 17:36:40,022 - INFO - Processing document 8-K_2023-05-26
2025-11-14 17:36:40,089 - INFO - Finished converting document 8-K_2023-05-26 in 0.12 sec.
2025-11-14 17:36:40,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,156 - INFO - Going to convert document batch...
2025-11-14 17:36:40,157 - INFO - Processing document 8-K_2023-06-16
2025-11-14 17:36:40,178 - INFO - Finished converting document 8-K_2023-06-16 in 0.05 sec.
2025-11-14 17:36:40,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,216 - INFO - Going to convert document batch...
2025-11-14 17:36:40,217 - INFO - Processing document 8-K_2023-07-18
2025-11-14 17:36:40,234 - INFO - Finished converting document 8-K_2023-07-18 in 0.05 sec.
2025-11-14 17:36:40,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,274 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SO\8-K_2023-05-26' --> 'data\processed_data\SO\8-K_2023-05-26.md'
Converted 'data\edgar_documents\SO\8-K_2023-06-16' --> 'data\processed_data\SO\8-K_2023-06-16.md'
Converted 'data\edgar_documents\SO\8-K_2023-07-18' --> 'data\processed_data\SO\8-K_2023-07-18.md'
Converted 'data\edgar_documents\SO\8-K_2023-07-31' --> 'data\processed_data\SO\8-K_2023-07-31.md'


2025-11-14 17:36:40,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,373 - INFO - Going to convert document batch...
2025-11-14 17:36:40,374 - INFO - Processing document 8-K_2023-08-03
2025-11-14 17:36:40,412 - INFO - Finished converting document 8-K_2023-08-03 in 0.09 sec.
2025-11-14 17:36:40,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,464 - INFO - Going to convert document batch...
2025-11-14 17:36:40,465 - INFO - Processing document 8-K_2023-08-30
2025-11-14 17:36:40,488 - INFO - Finished converting document 8-K_2023-08-30 in 0.05 sec.
2025-11-14 17:36:40,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,530 - INFO - Going to convert document batch...
2025-11-14 17:36:40,532 - INFO - Processing document 8-K_2023-09-08
2025-11-14 17:36:40,562 - INFO - Finished converting document 8-K_2023-09-08 in 0.06 sec.
2025-11-14 17:36:40,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SO\8-K_2023-08-03' --> 'data\processed_data\SO\8-K_2023-08-03.md'
Converted 'data\edgar_documents\SO\8-K_2023-08-30' --> 'data\processed_data\SO\8-K_2023-08-30.md'
Converted 'data\edgar_documents\SO\8-K_2023-09-08' --> 'data\processed_data\SO\8-K_2023-09-08.md'


2025-11-14 17:36:40,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,677 - INFO - Going to convert document batch...
2025-11-14 17:36:40,678 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:36:40,697 - INFO - Finished converting document 8-K_2023-10-17 in 0.05 sec.
2025-11-14 17:36:40,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:40,750 - INFO - Going to convert document batch...
2025-11-14 17:36:40,751 - INFO - Processing document 8-K_2023-11-02
2025-11-14 17:36:40,792 - INFO - Finished converting document 8-K_2023-11-02 in 0.09 sec.
2025-11-14 17:36:40,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\8-K_2023-10-06' --> 'data\processed_data\SO\8-K_2023-10-06.md'
Converted 'data\edgar_documents\SO\8-K_2023-10-17' --> 'data\processed_data\SO\8-K_2023-10-17.md'
Converted 'data\edgar_documents\SO\8-K_2023-11-02' --> 'data\processed_data\SO\8-K_2023-11-02.md'


2025-11-14 17:36:41,068 - INFO - Going to convert document batch...
2025-11-14 17:36:41,069 - INFO - Processing document 8-K_2023-12-12
2025-11-14 17:36:41,086 - INFO - Finished converting document 8-K_2023-12-12 in 0.27 sec.
2025-11-14 17:36:41,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,152 - INFO - Going to convert document batch...
2025-11-14 17:36:41,153 - INFO - Processing document 8-K_2023-12-19
2025-11-14 17:36:41,182 - INFO - Finished converting document 8-K_2023-12-19 in 0.09 sec.
2025-11-14 17:36:41,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,219 - INFO - Going to convert document batch...
2025-11-14 17:36:41,219 - INFO - Processing document 8-K_2024-02-01
2025-11-14 17:36:41,241 - INFO - Finished converting document 8-K_2024-02-01 in 0.05 sec.
2025-11-14 17:36:41,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,274 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SO\8-K_2023-12-12' --> 'data\processed_data\SO\8-K_2023-12-12.md'
Converted 'data\edgar_documents\SO\8-K_2023-12-19' --> 'data\processed_data\SO\8-K_2023-12-19.md'
Converted 'data\edgar_documents\SO\8-K_2024-02-01' --> 'data\processed_data\SO\8-K_2024-02-01.md'


2025-11-14 17:36:41,294 - INFO - Finished converting document 8-K_2024-02-06 in 0.05 sec.
2025-11-14 17:36:41,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,340 - INFO - Going to convert document batch...
2025-11-14 17:36:41,342 - INFO - Processing document 8-K_2024-02-15
2025-11-14 17:36:41,380 - INFO - Finished converting document 8-K_2024-02-15 in 0.08 sec.
2025-11-14 17:36:41,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,450 - INFO - Going to convert document batch...
2025-11-14 17:36:41,451 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:36:41,481 - INFO - Finished converting document 8-K_2024-02-28 in 0.08 sec.


Converted 'data\edgar_documents\SO\8-K_2024-02-06' --> 'data\processed_data\SO\8-K_2024-02-06.md'
Converted 'data\edgar_documents\SO\8-K_2024-02-15' --> 'data\processed_data\SO\8-K_2024-02-15.md'


2025-11-14 17:36:41,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,526 - INFO - Going to convert document batch...
2025-11-14 17:36:41,527 - INFO - Processing document 8-K_2024-04-29
2025-11-14 17:36:41,550 - INFO - Finished converting document 8-K_2024-04-29 in 0.05 sec.
2025-11-14 17:36:41,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,620 - INFO - Going to convert document batch...
2025-11-14 17:36:41,621 - INFO - Processing document 8-K_2024-05-02
2025-11-14 17:36:41,664 - INFO - Finished converting document 8-K_2024-05-02 in 0.09 sec.


Converted 'data\edgar_documents\SO\8-K_2024-02-28' --> 'data\processed_data\SO\8-K_2024-02-28.md'
Converted 'data\edgar_documents\SO\8-K_2024-04-29' --> 'data\processed_data\SO\8-K_2024-04-29.md'
Converted 'data\edgar_documents\SO\8-K_2024-05-02' --> 'data\processed_data\SO\8-K_2024-05-02.md'


2025-11-14 17:36:41,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,735 - INFO - Going to convert document batch...
2025-11-14 17:36:41,737 - INFO - Processing document 8-K_2024-05-03
2025-11-14 17:36:41,760 - INFO - Finished converting document 8-K_2024-05-03 in 0.06 sec.
2025-11-14 17:36:41,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,804 - INFO - Going to convert document batch...
2025-11-14 17:36:41,804 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:36:41,827 - INFO - Finished converting document 8-K_2024-05-06 in 0.05 sec.
2025-11-14 17:36:41,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,865 - INFO - Going to convert document batch...
2025-11-14 17:36:41,866 - INFO - Processing document 8-K_2024-05-07
2025-11-14 17:36:41,887 - INFO - Finished converting document 8-K_2024-05-07 in 0.05 sec.
2025-11-14 17:36:41,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SO\8-K_2024-05-03' --> 'data\processed_data\SO\8-K_2024-05-03.md'
Converted 'data\edgar_documents\SO\8-K_2024-05-06' --> 'data\processed_data\SO\8-K_2024-05-06.md'
Converted 'data\edgar_documents\SO\8-K_2024-05-07' --> 'data\processed_data\SO\8-K_2024-05-07.md'


2025-11-14 17:36:41,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:41,994 - INFO - Going to convert document batch...
2025-11-14 17:36:41,995 - INFO - Processing document 8-K_2024-05-13
2025-11-14 17:36:42,015 - INFO - Finished converting document 8-K_2024-05-13 in 0.05 sec.
2025-11-14 17:36:42,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,091 - INFO - Going to convert document batch...
2025-11-14 17:36:42,091 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:36:42,147 - INFO - Finished converting document 8-K_2024-05-24 in 0.11 sec.


Converted 'data\edgar_documents\SO\8-K_2024-05-09' --> 'data\processed_data\SO\8-K_2024-05-09.md'
Converted 'data\edgar_documents\SO\8-K_2024-05-13' --> 'data\processed_data\SO\8-K_2024-05-13.md'


2025-11-14 17:36:42,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,210 - INFO - Going to convert document batch...
2025-11-14 17:36:42,211 - INFO - Processing document 8-K_2024-08-01
2025-11-14 17:36:42,251 - INFO - Finished converting document 8-K_2024-08-01 in 0.08 sec.
2025-11-14 17:36:42,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,296 - INFO - Going to convert document batch...
2025-11-14 17:36:42,296 - INFO - Processing document 8-K_2024-09-09
2025-11-14 17:36:42,321 - INFO - Finished converting document 8-K_2024-09-09 in 0.05 sec.
2025-11-14 17:36:42,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,369 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SO\8-K_2024-05-24' --> 'data\processed_data\SO\8-K_2024-05-24.md'
Converted 'data\edgar_documents\SO\8-K_2024-08-01' --> 'data\processed_data\SO\8-K_2024-08-01.md'
Converted 'data\edgar_documents\SO\8-K_2024-09-09' --> 'data\processed_data\SO\8-K_2024-09-09.md'


2025-11-14 17:36:42,370 - INFO - Processing document 8-K_2024-10-31
2025-11-14 17:36:42,404 - INFO - Finished converting document 8-K_2024-10-31 in 0.08 sec.
2025-11-14 17:36:42,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,462 - INFO - Going to convert document batch...
2025-11-14 17:36:42,463 - INFO - Processing document 8-K_2024-12-10
2025-11-14 17:36:42,491 - INFO - Finished converting document 8-K_2024-12-10 in 0.06 sec.
2025-11-14 17:36:42,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,532 - INFO - Going to convert document batch...
2025-11-14 17:36:42,533 - INFO - Processing document 8-K_2025-01-13
2025-11-14 17:36:42,558 - INFO - Finished converting document 8-K_2025-01-13 in 0.06 sec.
2025-11-14 17:36:42,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\8-K_2024-10-31' --> 'data\processed_data\SO\8-K_2024-10-31.md'
Converted 'data\edgar_documents\SO\8-K_2024-12-10' --> 'data\processed_data\SO\8-K_2024-12-10.md'
Converted 'data\edgar_documents\SO\8-K_2025-01-13' --> 'data\processed_data\SO\8-K_2025-01-13.md'


2025-11-14 17:36:42,628 - INFO - Going to convert document batch...
2025-11-14 17:36:42,628 - INFO - Processing document 8-K_2025-02-11
2025-11-14 17:36:42,647 - INFO - Finished converting document 8-K_2025-02-11 in 0.06 sec.
2025-11-14 17:36:42,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,683 - INFO - Going to convert document batch...
2025-11-14 17:36:42,684 - INFO - Processing document 8-K_2025-02-12
2025-11-14 17:36:42,704 - INFO - Finished converting document 8-K_2025-02-12 in 0.05 sec.
2025-11-14 17:36:42,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,748 - INFO - Going to convert document batch...
2025-11-14 17:36:42,749 - INFO - Processing document 8-K_2025-02-20
2025-11-14 17:36:42,787 - INFO - Finished converting document 8-K_2025-02-20 in 0.06 sec.
2025-11-14 17:36:42,818 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,830 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SO\8-K_2025-02-11' --> 'data\processed_data\SO\8-K_2025-02-11.md'
Converted 'data\edgar_documents\SO\8-K_2025-02-12' --> 'data\processed_data\SO\8-K_2025-02-12.md'
Converted 'data\edgar_documents\SO\8-K_2025-02-20' --> 'data\processed_data\SO\8-K_2025-02-20.md'


2025-11-14 17:36:42,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:42,904 - INFO - Going to convert document batch...
2025-11-14 17:36:42,905 - INFO - Processing document 8-K_2025-05-01
2025-11-14 17:36:42,944 - INFO - Finished converting document 8-K_2025-05-01 in 0.06 sec.
2025-11-14 17:36:42,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,010 - INFO - Going to convert document batch...
2025-11-14 17:36:43,012 - INFO - Processing document 8-K_2025-05-19
2025-11-14 17:36:43,044 - INFO - Finished converting document 8-K_2025-05-19 in 0.09 sec.


Converted 'data\edgar_documents\SO\8-K_2025-02-28' --> 'data\processed_data\SO\8-K_2025-02-28.md'
Converted 'data\edgar_documents\SO\8-K_2025-05-01' --> 'data\processed_data\SO\8-K_2025-05-01.md'


2025-11-14 17:36:43,071 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,082 - INFO - Going to convert document batch...
2025-11-14 17:36:43,083 - INFO - Processing document 8-K_2025-05-20
2025-11-14 17:36:43,105 - INFO - Finished converting document 8-K_2025-05-20 in 0.05 sec.
2025-11-14 17:36:43,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,143 - INFO - Going to convert document batch...
2025-11-14 17:36:43,144 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:36:43,169 - INFO - Finished converting document 8-K_2025-05-21 in 0.06 sec.
2025-11-14 17:36:43,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,210 - INFO - Going to convert document batch...
2025-11-14 17:36:43,211 - INFO - Processing document 8-K_2025-05-27
2025-11-14 17:36:43,235 - INFO - Finished converting document 8-K_2025-05-27 in 0.05 sec.


Converted 'data\edgar_documents\SO\8-K_2025-05-19' --> 'data\processed_data\SO\8-K_2025-05-19.md'
Converted 'data\edgar_documents\SO\8-K_2025-05-20' --> 'data\processed_data\SO\8-K_2025-05-20.md'
Converted 'data\edgar_documents\SO\8-K_2025-05-21' --> 'data\processed_data\SO\8-K_2025-05-21.md'


2025-11-14 17:36:43,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,275 - INFO - Going to convert document batch...
2025-11-14 17:36:43,276 - INFO - Processing document 8-K_2025-07-01
2025-11-14 17:36:43,310 - INFO - Finished converting document 8-K_2025-07-01 in 0.06 sec.
2025-11-14 17:36:43,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,366 - INFO - Going to convert document batch...
2025-11-14 17:36:43,367 - INFO - Processing document 8-K_2025-07-11
2025-11-14 17:36:43,388 - INFO - Finished converting document 8-K_2025-07-11 in 0.06 sec.
2025-11-14 17:36:43,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,427 - INFO - Going to convert document batch...
2025-11-14 17:36:43,428 - INFO - Processing document 8-K_2025-07-18
2025-11-14 17:36:43,448 - INFO - Finished converting document 8-K_2025-07-18 in 0.05 sec.


Converted 'data\edgar_documents\SO\8-K_2025-05-27' --> 'data\processed_data\SO\8-K_2025-05-27.md'
Converted 'data\edgar_documents\SO\8-K_2025-07-01' --> 'data\processed_data\SO\8-K_2025-07-01.md'
Converted 'data\edgar_documents\SO\8-K_2025-07-11' --> 'data\processed_data\SO\8-K_2025-07-11.md'


2025-11-14 17:36:43,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,487 - INFO - Going to convert document batch...
2025-11-14 17:36:43,487 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:36:43,510 - INFO - Finished converting document 8-K_2025-07-23 in 0.05 sec.
2025-11-14 17:36:43,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,556 - INFO - Going to convert document batch...
2025-11-14 17:36:43,557 - INFO - Processing document 8-K_2025-07-31
2025-11-14 17:36:43,594 - INFO - Finished converting document 8-K_2025-07-31 in 0.08 sec.
2025-11-14 17:36:43,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,641 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SO\8-K_2025-07-18' --> 'data\processed_data\SO\8-K_2025-07-18.md'
Converted 'data\edgar_documents\SO\8-K_2025-07-23' --> 'data\processed_data\SO\8-K_2025-07-23.md'
Converted 'data\edgar_documents\SO\8-K_2025-07-31' --> 'data\processed_data\SO\8-K_2025-07-31.md'


2025-11-14 17:36:43,641 - INFO - Processing document 8-K_2025-09-15
2025-11-14 17:36:43,663 - INFO - Finished converting document 8-K_2025-09-15 in 0.05 sec.
2025-11-14 17:36:43,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,712 - INFO - Going to convert document batch...
2025-11-14 17:36:43,713 - INFO - Processing document 8-K_2025-10-30
2025-11-14 17:36:43,751 - INFO - Finished converting document 8-K_2025-10-30 in 0.08 sec.
2025-11-14 17:36:43,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:36:43,806 - INFO - Going to convert document batch...
2025-11-14 17:36:43,807 - INFO - Processing document 8-K_2025-11-06
2025-11-14 17:36:43,836 - INFO - Finished converting document 8-K_2025-11-06 in 0.05 sec.


Converted 'data\edgar_documents\SO\8-K_2025-09-15' --> 'data\processed_data\SO\8-K_2025-09-15.md'
Converted 'data\edgar_documents\SO\8-K_2025-10-30' --> 'data\processed_data\SO\8-K_2025-10-30.md'


2025-11-14 17:36:43,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\8-K_2025-11-06' --> 'data\processed_data\SO\8-K_2025-11-06.md'


2025-11-14 17:36:44,771 - INFO - Going to convert document batch...
2025-11-14 17:36:44,772 - INFO - Processing document DEF-14A_2023-04-14
2025-11-14 17:37:07,275 - INFO - Finished converting document DEF-14A_2023-04-14 in 23.41 sec.
2025-11-14 17:37:08,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\DEF-14A_2023-04-14' --> 'data\processed_data\SO\DEF-14A_2023-04-14.md'


2025-11-14 17:37:09,552 - INFO - Going to convert document batch...
2025-11-14 17:37:09,554 - INFO - Processing document DEF-14A_2024-04-12
2025-11-14 17:37:19,406 - INFO - Finished converting document DEF-14A_2024-04-12 in 10.69 sec.
2025-11-14 17:37:20,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\DEF-14A_2024-04-12' --> 'data\processed_data\SO\DEF-14A_2024-04-12.md'


2025-11-14 17:37:21,350 - INFO - Going to convert document batch...
2025-11-14 17:37:21,351 - INFO - Processing document DEF-14A_2025-04-11
2025-11-14 17:37:24,939 - INFO - Finished converting document DEF-14A_2025-04-11 in 4.61 sec.
2025-11-14 17:37:26,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SO\DEF-14A_2025-04-11' --> 'data\processed_data\SO\DEF-14A_2025-04-11.md'
Processed 148 new files. Errors: 14
Found 81 files to process in data\edgar_documents\SPG


2025-11-14 17:37:28,926 - INFO - Going to convert document batch...
2025-11-14 17:37:28,927 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:37:28,928 - INFO - Processing document 10-K_2023-02-23
2025-11-14 17:37:41,181 - INFO - Finished converting document 10-K_2023-02-23 in 15.11 sec.


Converted 'data\edgar_documents\SPG\10-K_2023-02-23' --> 'data\processed_data\SPG\10-K_2023-02-23.md'


2025-11-14 17:37:42,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:37:45,116 - INFO - Going to convert document batch...
2025-11-14 17:37:45,117 - INFO - Processing document 10-K_2024-02-22
2025-11-14 17:37:56,525 - INFO - Finished converting document 10-K_2024-02-22 in 14.17 sec.


Converted 'data\edgar_documents\SPG\10-K_2024-02-22' --> 'data\processed_data\SPG\10-K_2024-02-22.md'


2025-11-14 17:37:57,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:01,635 - INFO - Going to convert document batch...
2025-11-14 17:38:01,635 - INFO - Processing document 10-K_2025-02-21
2025-11-14 17:38:13,847 - INFO - Finished converting document 10-K_2025-02-21 in 16.17 sec.
2025-11-14 17:38:15,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-K_2025-02-21' --> 'data\processed_data\SPG\10-K_2025-02-21.md'


2025-11-14 17:38:16,672 - INFO - Going to convert document batch...
2025-11-14 17:38:16,672 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 17:38:18,370 - INFO - Finished converting document 10-Q_2023-05-04 in 3.36 sec.
2025-11-14 17:38:18,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2023-05-04' --> 'data\processed_data\SPG\10-Q_2023-05-04.md'


2025-11-14 17:38:19,642 - INFO - Going to convert document batch...
2025-11-14 17:38:19,643 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 17:38:22,883 - INFO - Finished converting document 10-Q_2023-08-03 in 4.09 sec.
2025-11-14 17:38:23,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2023-08-03' --> 'data\processed_data\SPG\10-Q_2023-08-03.md'


2025-11-14 17:38:24,332 - INFO - Going to convert document batch...
2025-11-14 17:38:24,333 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 17:38:27,351 - INFO - Finished converting document 10-Q_2023-11-02 in 3.95 sec.
2025-11-14 17:38:27,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2023-11-02' --> 'data\processed_data\SPG\10-Q_2023-11-02.md'


2025-11-14 17:38:28,561 - INFO - Going to convert document batch...
2025-11-14 17:38:28,562 - INFO - Processing document 10-Q_2024-05-07
2025-11-14 17:38:30,451 - INFO - Finished converting document 10-Q_2024-05-07 in 2.55 sec.
2025-11-14 17:38:30,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2024-05-07' --> 'data\processed_data\SPG\10-Q_2024-05-07.md'


2025-11-14 17:38:32,296 - INFO - Going to convert document batch...
2025-11-14 17:38:32,296 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 17:38:34,849 - INFO - Finished converting document 10-Q_2024-08-07 in 3.99 sec.
2025-11-14 17:38:35,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2024-08-07' --> 'data\processed_data\SPG\10-Q_2024-08-07.md'


2025-11-14 17:38:36,774 - INFO - Going to convert document batch...
2025-11-14 17:38:36,776 - INFO - Processing document 10-Q_2024-11-08
2025-11-14 17:38:39,859 - INFO - Finished converting document 10-Q_2024-11-08 in 4.11 sec.
2025-11-14 17:38:40,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2024-11-08' --> 'data\processed_data\SPG\10-Q_2024-11-08.md'


2025-11-14 17:38:41,103 - INFO - Going to convert document batch...
2025-11-14 17:38:41,104 - INFO - Processing document 10-Q_2025-05-12
2025-11-14 17:38:43,154 - INFO - Finished converting document 10-Q_2025-05-12 in 2.72 sec.


Converted 'data\edgar_documents\SPG\10-Q_2025-05-12' --> 'data\processed_data\SPG\10-Q_2025-05-12.md'


2025-11-14 17:38:43,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:45,331 - INFO - Going to convert document batch...
2025-11-14 17:38:45,331 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 17:38:48,539 - INFO - Finished converting document 10-Q_2025-08-07 in 4.94 sec.
2025-11-14 17:38:49,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\10-Q_2025-08-07' --> 'data\processed_data\SPG\10-Q_2025-08-07.md'


2025-11-14 17:38:50,750 - INFO - Going to convert document batch...
2025-11-14 17:38:50,751 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 17:38:53,743 - INFO - Finished converting document 10-Q_2025-11-06 in 4.61 sec.
2025-11-14 17:38:54,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,417 - INFO - Going to convert document batch...
2025-11-14 17:38:54,418 - INFO - Processing document 4_2023-01-03
2025-11-14 17:38:54,436 - INFO - Finished converting document 4_2023-01-03 in 0.06 sec.
2025-11-14 17:38:54,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,511 - INFO - Going to convert document batch...
2025-11-14 17:38:54,512 - INFO - Processing document 4_2023-01-04
2025-11-14 17:38:54,531 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.


Converted 'data\edgar_documents\SPG\10-Q_2025-11-06' --> 'data\processed_data\SPG\10-Q_2025-11-06.md'
Converted 'data\edgar_documents\SPG\4_2023-01-03' --> 'data\processed_data\SPG\4_2023-01-03.md'
Converted 'data\edgar_documents\SPG\4_2023-01-04' --> 'data\processed_data\SPG\4_2023-01-04.md'


2025-11-14 17:38:54,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,596 - INFO - Going to convert document batch...
2025-11-14 17:38:54,597 - INFO - Processing document 4_2023-03-03
2025-11-14 17:38:54,616 - INFO - Finished converting document 4_2023-03-03 in 0.06 sec.
2025-11-14 17:38:54,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,657 - INFO - Going to convert document batch...
2025-11-14 17:38:54,659 - INFO - Processing document 4_2023-03-30
2025-11-14 17:38:54,678 - INFO - Finished converting document 4_2023-03-30 in 0.03 sec.
2025-11-14 17:38:54,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,729 - INFO - Going to convert document batch...
2025-11-14 17:38:54,731 - INFO - Processing document 4_2023-04-03
2025-11-14 17:38:54,757 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 17:38:54,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\SPG\4_2023-03-03' --> 'data\processed_data\SPG\4_2023-03-03.md'
Converted 'data\edgar_documents\SPG\4_2023-03-30' --> 'data\processed_data\SPG\4_2023-03-30.md'
Converted 'data\edgar_documents\SPG\4_2023-04-03' --> 'data\processed_data\SPG\4_2023-04-03.md'


2025-11-14 17:38:54,842 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 17:38:54,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,893 - INFO - Going to convert document batch...
2025-11-14 17:38:54,894 - INFO - Processing document 4_2023-05-05
2025-11-14 17:38:54,930 - INFO - Finished converting document 4_2023-05-05 in 0.06 sec.
2025-11-14 17:38:54,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:54,978 - INFO - Going to convert document batch...
2025-11-14 17:38:54,979 - INFO - Processing document 4_2023-07-05
2025-11-14 17:38:55,004 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 17:38:55,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\4_2023-04-04' --> 'data\processed_data\SPG\4_2023-04-04.md'
Converted 'data\edgar_documents\SPG\4_2023-05-05' --> 'data\processed_data\SPG\4_2023-05-05.md'
Converted 'data\edgar_documents\SPG\4_2023-07-05' --> 'data\processed_data\SPG\4_2023-07-05.md'


2025-11-14 17:38:55,049 - INFO - Going to convert document batch...
2025-11-14 17:38:55,049 - INFO - Processing document 4_2023-10-03
2025-11-14 17:38:55,070 - INFO - Finished converting document 4_2023-10-03 in 0.03 sec.
2025-11-14 17:38:55,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,127 - INFO - Going to convert document batch...
2025-11-14 17:38:55,129 - INFO - Processing document 4_2023-12-18
2025-11-14 17:38:55,161 - INFO - Finished converting document 4_2023-12-18 in 0.06 sec.
2025-11-14 17:38:55,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,217 - INFO - Going to convert document batch...
2025-11-14 17:38:55,218 - INFO - Processing document 4_2024-01-02
2025-11-14 17:38:55,241 - INFO - Finished converting document 4_2024-01-02 in 0.06 sec.
2025-11-14 17:38:55,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,283 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\SPG\4_2023-10-03' --> 'data\processed_data\SPG\4_2023-10-03.md'
Converted 'data\edgar_documents\SPG\4_2023-12-18' --> 'data\processed_data\SPG\4_2023-12-18.md'
Converted 'data\edgar_documents\SPG\4_2024-01-02' --> 'data\processed_data\SPG\4_2024-01-02.md'


2025-11-14 17:38:55,284 - INFO - Processing document 4_2024-01-03
2025-11-14 17:38:55,306 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 17:38:55,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,350 - INFO - Going to convert document batch...
2025-11-14 17:38:55,351 - INFO - Processing document 4_2024-01-11
2025-11-14 17:38:55,370 - INFO - Finished converting document 4_2024-01-11 in 0.05 sec.
2025-11-14 17:38:55,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,410 - INFO - Going to convert document batch...
2025-11-14 17:38:55,411 - INFO - Processing document 4_2024-03-04
2025-11-14 17:38:55,431 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.
2025-11-14 17:38:55,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,473 - INFO - Going to convert document batch...
2025-11-14 17:38:55,475 - INFO - Processing document 4_2024-03-08
2025-11-14 17:38:55,495 - IN

Converted 'data\edgar_documents\SPG\4_2024-01-03' --> 'data\processed_data\SPG\4_2024-01-03.md'
Converted 'data\edgar_documents\SPG\4_2024-01-11' --> 'data\processed_data\SPG\4_2024-01-11.md'
Converted 'data\edgar_documents\SPG\4_2024-03-04' --> 'data\processed_data\SPG\4_2024-03-04.md'
Converted 'data\edgar_documents\SPG\4_2024-03-08' --> 'data\processed_data\SPG\4_2024-03-08.md'


2025-11-14 17:38:55,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,552 - INFO - Going to convert document batch...
2025-11-14 17:38:55,553 - INFO - Processing document 4_2024-03-25
2025-11-14 17:38:55,571 - INFO - Finished converting document 4_2024-03-25 in 0.05 sec.
2025-11-14 17:38:55,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,613 - INFO - Going to convert document batch...
2025-11-14 17:38:55,613 - INFO - Processing document 4_2024-04-02
2025-11-14 17:38:55,633 - INFO - Finished converting document 4_2024-04-02 in 0.03 sec.
2025-11-14 17:38:55,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,672 - INFO - Going to convert document batch...
2025-11-14 17:38:55,673 - INFO - Processing document 4_2024-04-03
2025-11-14 17:38:55,693 - INFO - Finished converting document 4_2024-04-03 in 0.03 sec.
2025-11-14 17:38:55,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\SPG\4_2024-03-25' --> 'data\processed_data\SPG\4_2024-03-25.md'
Converted 'data\edgar_documents\SPG\4_2024-04-02' --> 'data\processed_data\SPG\4_2024-04-02.md'
Converted 'data\edgar_documents\SPG\4_2024-04-03' --> 'data\processed_data\SPG\4_2024-04-03.md'
Converted 'data\edgar_documents\SPG\4_2024-05-09' --> 'data\processed_data\SPG\4_2024-05-09.md'


2025-11-14 17:38:55,811 - INFO - Going to convert document batch...
2025-11-14 17:38:55,812 - INFO - Processing document 4_2024-07-02
2025-11-14 17:38:55,833 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 17:38:55,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,882 - INFO - Going to convert document batch...
2025-11-14 17:38:55,883 - INFO - Processing document 4_2024-08-30
2025-11-14 17:38:55,902 - INFO - Finished converting document 4_2024-08-30 in 0.05 sec.
2025-11-14 17:38:55,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,941 - INFO - Going to convert document batch...
2025-11-14 17:38:55,942 - INFO - Processing document 4_2024-10-01
2025-11-14 17:38:55,959 - INFO - Finished converting document 4_2024-10-01 in 0.03 sec.
2025-11-14 17:38:55,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:55,998 - INFO - Going to convert document batch...
2025-11-14 17:38:55,998 - 

Converted 'data\edgar_documents\SPG\4_2024-07-02' --> 'data\processed_data\SPG\4_2024-07-02.md'
Converted 'data\edgar_documents\SPG\4_2024-08-30' --> 'data\processed_data\SPG\4_2024-08-30.md'
Converted 'data\edgar_documents\SPG\4_2024-10-01' --> 'data\processed_data\SPG\4_2024-10-01.md'
Converted 'data\edgar_documents\SPG\4_2024-12-10' --> 'data\processed_data\SPG\4_2024-12-10.md'


2025-11-14 17:38:56,054 - INFO - Going to convert document batch...
2025-11-14 17:38:56,054 - INFO - Processing document 4_2024-12-26
2025-11-14 17:38:56,080 - INFO - Finished converting document 4_2024-12-26 in 0.05 sec.
2025-11-14 17:38:56,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,119 - INFO - Going to convert document batch...
2025-11-14 17:38:56,120 - INFO - Processing document 4_2025-01-02
2025-11-14 17:38:56,140 - INFO - Finished converting document 4_2025-01-02 in 0.05 sec.
2025-11-14 17:38:56,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,191 - INFO - Going to convert document batch...
2025-11-14 17:38:56,192 - INFO - Processing document 4_2025-03-05
2025-11-14 17:38:56,210 - INFO - Finished converting document 4_2025-03-05 in 0.05 sec.
2025-11-14 17:38:56,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,250 - INFO - Going to convert document batch...
2025-11-14 17:38:56,250 - 

Converted 'data\edgar_documents\SPG\4_2024-12-26' --> 'data\processed_data\SPG\4_2024-12-26.md'
Converted 'data\edgar_documents\SPG\4_2025-01-02' --> 'data\processed_data\SPG\4_2025-01-02.md'
Converted 'data\edgar_documents\SPG\4_2025-03-05' --> 'data\processed_data\SPG\4_2025-03-05.md'


2025-11-14 17:38:56,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,315 - INFO - Going to convert document batch...
2025-11-14 17:38:56,316 - INFO - Processing document 4_2025-03-20
2025-11-14 17:38:56,338 - INFO - Finished converting document 4_2025-03-20 in 0.05 sec.
2025-11-14 17:38:56,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,381 - INFO - Going to convert document batch...
2025-11-14 17:38:56,381 - INFO - Processing document 4_2025-03-27
2025-11-14 17:38:56,400 - INFO - Finished converting document 4_2025-03-27 in 0.03 sec.
2025-11-14 17:38:56,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,441 - INFO - Going to convert document batch...
2025-11-14 17:38:56,442 - INFO - Processing document 4_2025-04-02
2025-11-14 17:38:56,461 - INFO - Finished converting document 4_2025-04-02 in 0.03 sec.


Converted 'data\edgar_documents\SPG\4_2025-03-13' --> 'data\processed_data\SPG\4_2025-03-13.md'
Converted 'data\edgar_documents\SPG\4_2025-03-20' --> 'data\processed_data\SPG\4_2025-03-20.md'
Converted 'data\edgar_documents\SPG\4_2025-03-27' --> 'data\processed_data\SPG\4_2025-03-27.md'


2025-11-14 17:38:56,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,501 - INFO - Going to convert document batch...
2025-11-14 17:38:56,503 - INFO - Processing document 4_2025-04-03
2025-11-14 17:38:56,525 - INFO - Finished converting document 4_2025-04-03 in 0.03 sec.
2025-11-14 17:38:56,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,577 - INFO - Going to convert document batch...
2025-11-14 17:38:56,578 - INFO - Processing document 4_2025-05-16
2025-11-14 17:38:56,596 - INFO - Finished converting document 4_2025-05-16 in 0.05 sec.
2025-11-14 17:38:56,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,652 - INFO - Going to convert document batch...
2025-11-14 17:38:56,653 - INFO - Processing document 4_2025-06-16
2025-11-14 17:38:56,671 - INFO - Finished converting document 4_2025-06-16 in 0.06 sec.


Converted 'data\edgar_documents\SPG\4_2025-04-02' --> 'data\processed_data\SPG\4_2025-04-02.md'
Converted 'data\edgar_documents\SPG\4_2025-04-03' --> 'data\processed_data\SPG\4_2025-04-03.md'
Converted 'data\edgar_documents\SPG\4_2025-05-16' --> 'data\processed_data\SPG\4_2025-05-16.md'


2025-11-14 17:38:56,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,709 - INFO - Going to convert document batch...
2025-11-14 17:38:56,710 - INFO - Processing document 4_2025-06-30
2025-11-14 17:38:56,728 - INFO - Finished converting document 4_2025-06-30 in 0.03 sec.
2025-11-14 17:38:56,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,773 - INFO - Going to convert document batch...
2025-11-14 17:38:56,775 - INFO - Processing document 4_2025-07-01
2025-11-14 17:38:56,796 - INFO - Finished converting document 4_2025-07-01 in 0.05 sec.
2025-11-14 17:38:56,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,834 - INFO - Going to convert document batch...
2025-11-14 17:38:56,835 - INFO - Processing document 4_2025-08-15
2025-11-14 17:38:56,853 - INFO - Finished converting document 4_2025-08-15 in 0.03 sec.


Converted 'data\edgar_documents\SPG\4_2025-06-16' --> 'data\processed_data\SPG\4_2025-06-16.md'
Converted 'data\edgar_documents\SPG\4_2025-06-30' --> 'data\processed_data\SPG\4_2025-06-30.md'
Converted 'data\edgar_documents\SPG\4_2025-07-01' --> 'data\processed_data\SPG\4_2025-07-01.md'


2025-11-14 17:38:56,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,892 - INFO - Going to convert document batch...
2025-11-14 17:38:56,893 - INFO - Processing document 4_2025-09-02
2025-11-14 17:38:56,912 - INFO - Finished converting document 4_2025-09-02 in 0.03 sec.
2025-11-14 17:38:56,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:56,984 - INFO - Going to convert document batch...
2025-11-14 17:38:56,986 - INFO - Processing document 4_2025-10-01
2025-11-14 17:38:57,005 - INFO - Finished converting document 4_2025-10-01 in 0.05 sec.
2025-11-14 17:38:57,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\4_2025-08-15' --> 'data\processed_data\SPG\4_2025-08-15.md'
Converted 'data\edgar_documents\SPG\4_2025-09-02' --> 'data\processed_data\SPG\4_2025-09-02.md'
Converted 'data\edgar_documents\SPG\4_2025-10-01' --> 'data\processed_data\SPG\4_2025-10-01.md'


2025-11-14 17:38:57,082 - INFO - Going to convert document batch...
2025-11-14 17:38:57,082 - INFO - Processing document 8-K_2023-02-06
2025-11-14 17:38:57,110 - INFO - Finished converting document 8-K_2023-02-06 in 0.09 sec.
2025-11-14 17:38:57,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,157 - INFO - Going to convert document batch...
2025-11-14 17:38:57,158 - INFO - Processing document 8-K_2023-03-15
2025-11-14 17:38:57,184 - INFO - Finished converting document 8-K_2023-03-15 in 0.06 sec.
2025-11-14 17:38:57,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,227 - INFO - Going to convert document batch...
2025-11-14 17:38:57,228 - INFO - Processing document 8-K_2023-03-23
2025-11-14 17:38:57,249 - INFO - Finished converting document 8-K_2023-03-23 in 0.05 sec.
2025-11-14 17:38:57,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,291 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SPG\8-K_2023-02-06' --> 'data\processed_data\SPG\8-K_2023-02-06.md'
Converted 'data\edgar_documents\SPG\8-K_2023-03-15' --> 'data\processed_data\SPG\8-K_2023-03-15.md'
Converted 'data\edgar_documents\SPG\8-K_2023-03-23' --> 'data\processed_data\SPG\8-K_2023-03-23.md'


2025-11-14 17:38:57,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,361 - INFO - Going to convert document batch...
2025-11-14 17:38:57,362 - INFO - Processing document 8-K_2023-05-05
2025-11-14 17:38:57,404 - INFO - Finished converting document 8-K_2023-05-05 in 0.08 sec.
2025-11-14 17:38:57,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,477 - INFO - Going to convert document batch...
2025-11-14 17:38:57,478 - INFO - Processing document 8-K_2023-08-02
2025-11-14 17:38:57,509 - INFO - Finished converting document 8-K_2023-08-02 in 0.08 sec.


Converted 'data\edgar_documents\SPG\8-K_2023-05-02' --> 'data\processed_data\SPG\8-K_2023-05-02.md'
Converted 'data\edgar_documents\SPG\8-K_2023-05-05' --> 'data\processed_data\SPG\8-K_2023-05-05.md'


2025-11-14 17:38:57,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,559 - INFO - Going to convert document batch...
2025-11-14 17:38:57,561 - INFO - Processing document 8-K_2023-10-30
2025-11-14 17:38:57,593 - INFO - Finished converting document 8-K_2023-10-30 in 0.06 sec.
2025-11-14 17:38:57,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,664 - INFO - Going to convert document batch...
2025-11-14 17:38:57,664 - INFO - Processing document 8-K_2023-11-08
2025-11-14 17:38:57,691 - INFO - Finished converting document 8-K_2023-11-08 in 0.08 sec.


Converted 'data\edgar_documents\SPG\8-K_2023-08-02' --> 'data\processed_data\SPG\8-K_2023-08-02.md'
Converted 'data\edgar_documents\SPG\8-K_2023-10-30' --> 'data\processed_data\SPG\8-K_2023-10-30.md'
Converted 'data\edgar_documents\SPG\8-K_2023-11-08' --> 'data\processed_data\SPG\8-K_2023-11-08.md'


2025-11-14 17:38:57,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,741 - INFO - Going to convert document batch...
2025-11-14 17:38:57,742 - INFO - Processing document 8-K_2023-11-09
2025-11-14 17:38:57,771 - INFO - Finished converting document 8-K_2023-11-09 in 0.05 sec.
2025-11-14 17:38:57,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,827 - INFO - Going to convert document batch...
2025-11-14 17:38:57,828 - INFO - Processing document 8-K_2024-01-09
2025-11-14 17:38:57,848 - INFO - Finished converting document 8-K_2024-01-09 in 0.05 sec.
2025-11-14 17:38:57,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:57,889 - INFO - Going to convert document batch...
2025-11-14 17:38:57,890 - INFO - Processing document 8-K_2024-02-05
2025-11-14 17:38:57,913 - INFO - Finished converting document 8-K_2024-02-05 in 0.05 sec.
2025-11-14 17:38:57,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\SPG\8-K_2023-11-09' --> 'data\processed_data\SPG\8-K_2023-11-09.md'
Converted 'data\edgar_documents\SPG\8-K_2024-01-09' --> 'data\processed_data\SPG\8-K_2024-01-09.md'
Converted 'data\edgar_documents\SPG\8-K_2024-02-05' --> 'data\processed_data\SPG\8-K_2024-02-05.md'


2025-11-14 17:38:57,986 - INFO - Processing document 8-K_2024-02-08
2025-11-14 17:38:58,007 - INFO - Finished converting document 8-K_2024-02-08 in 0.06 sec.
2025-11-14 17:38:58,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,050 - INFO - Going to convert document batch...
2025-11-14 17:38:58,052 - INFO - Processing document 8-K_2024-02-09
2025-11-14 17:38:58,091 - INFO - Finished converting document 8-K_2024-02-09 in 0.08 sec.
2025-11-14 17:38:58,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,141 - INFO - Going to convert document batch...
2025-11-14 17:38:58,142 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:38:58,165 - INFO - Finished converting document 8-K_2024-05-06 in 0.05 sec.
2025-11-14 17:38:58,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\8-K_2024-02-08' --> 'data\processed_data\SPG\8-K_2024-02-08.md'
Converted 'data\edgar_documents\SPG\8-K_2024-02-09' --> 'data\processed_data\SPG\8-K_2024-02-09.md'
Converted 'data\edgar_documents\SPG\8-K_2024-05-06' --> 'data\processed_data\SPG\8-K_2024-05-06.md'


2025-11-14 17:38:58,211 - INFO - Going to convert document batch...
2025-11-14 17:38:58,212 - INFO - Processing document 8-K_2024-05-08
2025-11-14 17:38:58,239 - INFO - Finished converting document 8-K_2024-05-08 in 0.05 sec.
2025-11-14 17:38:58,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,281 - INFO - Going to convert document batch...
2025-11-14 17:38:58,282 - INFO - Processing document 8-K_2024-05-29
2025-11-14 17:38:58,300 - INFO - Finished converting document 8-K_2024-05-29 in 0.05 sec.
2025-11-14 17:38:58,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,360 - INFO - Going to convert document batch...
2025-11-14 17:38:58,361 - INFO - Processing document 8-K_2024-08-05
2025-11-14 17:38:58,385 - INFO - Finished converting document 8-K_2024-08-05 in 0.06 sec.
2025-11-14 17:38:58,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,431 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SPG\8-K_2024-05-08' --> 'data\processed_data\SPG\8-K_2024-05-08.md'
Converted 'data\edgar_documents\SPG\8-K_2024-05-29' --> 'data\processed_data\SPG\8-K_2024-05-29.md'
Converted 'data\edgar_documents\SPG\8-K_2024-08-05' --> 'data\processed_data\SPG\8-K_2024-08-05.md'


2025-11-14 17:38:58,473 - INFO - Finished converting document 8-K_2024-08-30 in 0.06 sec.
2025-11-14 17:38:58,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:58,531 - INFO - Going to convert document batch...
2025-11-14 17:38:58,532 - INFO - Processing document 8-K_2024-09-19
2025-11-14 17:38:58,567 - INFO - Finished converting document 8-K_2024-09-19 in 0.06 sec.
2025-11-14 17:38:58,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\8-K_2024-08-30' --> 'data\processed_data\SPG\8-K_2024-08-30.md'
Converted 'data\edgar_documents\SPG\8-K_2024-09-19' --> 'data\processed_data\SPG\8-K_2024-09-19.md'


2025-11-14 17:38:59,138 - INFO - Going to convert document batch...
2025-11-14 17:38:59,139 - INFO - Processing document 8-K_2024-11-01
2025-11-14 17:38:59,159 - INFO - Finished converting document 8-K_2024-11-01 in 0.56 sec.
2025-11-14 17:38:59,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,208 - INFO - Going to convert document batch...
2025-11-14 17:38:59,209 - INFO - Processing document 8-K_2025-02-04
2025-11-14 17:38:59,232 - INFO - Finished converting document 8-K_2025-02-04 in 0.06 sec.
2025-11-14 17:38:59,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,272 - INFO - Going to convert document batch...
2025-11-14 17:38:59,273 - INFO - Processing document 8-K_2025-02-06
2025-11-14 17:38:59,291 - INFO - Finished converting document 8-K_2025-02-06 in 0.03 sec.
2025-11-14 17:38:59,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,328 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\SPG\8-K_2024-11-01' --> 'data\processed_data\SPG\8-K_2024-11-01.md'
Converted 'data\edgar_documents\SPG\8-K_2025-02-04' --> 'data\processed_data\SPG\8-K_2025-02-04.md'
Converted 'data\edgar_documents\SPG\8-K_2025-02-06' --> 'data\processed_data\SPG\8-K_2025-02-06.md'


2025-11-14 17:38:59,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,386 - INFO - Going to convert document batch...
2025-11-14 17:38:59,387 - INFO - Processing document 8-K_2025-05-12
2025-11-14 17:38:59,413 - INFO - Finished converting document 8-K_2025-05-12 in 0.05 sec.
2025-11-14 17:38:59,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,479 - INFO - Going to convert document batch...
2025-11-14 17:38:59,480 - INFO - Processing document 8-K_2025-05-15
2025-11-14 17:38:59,539 - INFO - Finished converting document 8-K_2025-05-15 in 0.09 sec.


Converted 'data\edgar_documents\SPG\8-K_2025-03-20' --> 'data\processed_data\SPG\8-K_2025-03-20.md'
Converted 'data\edgar_documents\SPG\8-K_2025-05-12' --> 'data\processed_data\SPG\8-K_2025-05-12.md'
Converted 'data\edgar_documents\SPG\8-K_2025-05-15' --> 'data\processed_data\SPG\8-K_2025-05-15.md'


2025-11-14 17:38:59,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,595 - INFO - Going to convert document batch...
2025-11-14 17:38:59,596 - INFO - Processing document 8-K_2025-08-04
2025-11-14 17:38:59,618 - INFO - Finished converting document 8-K_2025-08-04 in 0.05 sec.
2025-11-14 17:38:59,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,660 - INFO - Going to convert document batch...
2025-11-14 17:38:59,662 - INFO - Processing document 8-K_2025-08-07
2025-11-14 17:38:59,677 - INFO - Finished converting document 8-K_2025-08-07 in 0.03 sec.
2025-11-14 17:38:59,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:38:59,712 - INFO - Going to convert document batch...
2025-11-14 17:38:59,713 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:38:59,734 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 17:38:59,828 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_ja

Converted 'data\edgar_documents\SPG\8-K_2025-08-04' --> 'data\processed_data\SPG\8-K_2025-08-04.md'
Converted 'data\edgar_documents\SPG\8-K_2025-08-07' --> 'data\processed_data\SPG\8-K_2025-08-07.md'
Converted 'data\edgar_documents\SPG\8-K_2025-11-03' --> 'data\processed_data\SPG\8-K_2025-11-03.md'


2025-11-14 17:38:59,829 - ERROR - Input document DEF-14A_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:38:59,832 - INFO - Going to convert document batch...
2025-11-14 17:38:59,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\SPG\DEF-14A_2023-03-23: File format not allowed: data\edgar_documents\SPG\DEF-14A_2023-03-23


2025-11-14 17:39:00,682 - INFO - Going to convert document batch...
2025-11-14 17:39:00,683 - INFO - Processing document DEF-14A_2024-03-27
2025-11-14 17:39:04,696 - INFO - Finished converting document DEF-14A_2024-03-27 in 4.86 sec.
2025-11-14 17:39:05,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\DEF-14A_2024-03-27' --> 'data\processed_data\SPG\DEF-14A_2024-03-27.md'


2025-11-14 17:39:06,731 - INFO - Going to convert document batch...
2025-11-14 17:39:06,732 - INFO - Processing document DEF-14A_2025-04-01
2025-11-14 17:39:15,393 - INFO - Finished converting document DEF-14A_2025-04-01 in 10.11 sec.
2025-11-14 17:39:17,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\SPG\DEF-14A_2025-04-01' --> 'data\processed_data\SPG\DEF-14A_2025-04-01.md'
Processed 80 new files. Errors: 1
Found 140 files to process in data\edgar_documents\T


2025-11-14 17:39:18,734 - INFO - Going to convert document batch...
2025-11-14 17:39:18,734 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:39:18,735 - INFO - Processing document 10-K_2023-02-13
2025-11-14 17:39:22,241 - INFO - Finished converting document 10-K_2023-02-13 in 5.14 sec.
2025-11-14 17:39:23,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-K_2023-02-13' --> 'data\processed_data\T\10-K_2023-02-13.md'


2025-11-14 17:39:24,785 - INFO - Going to convert document batch...
2025-11-14 17:39:24,786 - INFO - Processing document 10-K_2024-02-23
2025-11-14 17:39:28,017 - INFO - Finished converting document 10-K_2024-02-23 in 4.67 sec.
2025-11-14 17:39:29,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-K_2024-02-23' --> 'data\processed_data\T\10-K_2024-02-23.md'


2025-11-14 17:39:30,726 - INFO - Going to convert document batch...
2025-11-14 17:39:30,727 - INFO - Processing document 10-K_2025-02-12
2025-11-14 17:39:33,612 - INFO - Finished converting document 10-K_2025-02-12 in 4.50 sec.
2025-11-14 17:39:34,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-K_2025-02-12' --> 'data\processed_data\T\10-K_2025-02-12.md'


2025-11-14 17:39:35,737 - INFO - Going to convert document batch...
2025-11-14 17:39:35,737 - INFO - Processing document 10-Q_2023-05-01
2025-11-14 17:39:36,531 - INFO - Finished converting document 10-Q_2023-05-01 in 1.88 sec.
2025-11-14 17:39:37,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2023-05-01' --> 'data\processed_data\T\10-Q_2023-05-01.md'


2025-11-14 17:39:38,164 - INFO - Going to convert document batch...
2025-11-14 17:39:38,165 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:39:39,207 - INFO - Finished converting document 10-Q_2023-07-27 in 2.22 sec.
2025-11-14 17:39:39,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2023-07-27' --> 'data\processed_data\T\10-Q_2023-07-27.md'


2025-11-14 17:39:40,501 - INFO - Going to convert document batch...
2025-11-14 17:39:40,502 - INFO - Processing document 10-Q_2023-10-31
2025-11-14 17:39:42,019 - INFO - Finished converting document 10-Q_2023-10-31 in 2.17 sec.
2025-11-14 17:39:42,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2023-10-31' --> 'data\processed_data\T\10-Q_2023-10-31.md'


2025-11-14 17:39:43,044 - INFO - Going to convert document batch...
2025-11-14 17:39:43,045 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 17:39:43,837 - INFO - Finished converting document 10-Q_2024-05-02 in 1.22 sec.
2025-11-14 17:39:44,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2024-05-02' --> 'data\processed_data\T\10-Q_2024-05-02.md'


2025-11-14 17:39:45,316 - INFO - Going to convert document batch...
2025-11-14 17:39:45,317 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:39:46,304 - INFO - Finished converting document 10-Q_2024-07-25 in 2.02 sec.
2025-11-14 17:39:46,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2024-07-25' --> 'data\processed_data\T\10-Q_2024-07-25.md'


2025-11-14 17:39:47,805 - INFO - Going to convert document batch...
2025-11-14 17:39:47,806 - INFO - Processing document 10-Q_2024-10-29
2025-11-14 17:39:48,810 - INFO - Finished converting document 10-Q_2024-10-29 in 1.95 sec.
2025-11-14 17:39:49,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2024-10-29' --> 'data\processed_data\T\10-Q_2024-10-29.md'


2025-11-14 17:39:49,890 - INFO - Going to convert document batch...
2025-11-14 17:39:49,890 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:39:50,667 - INFO - Finished converting document 10-Q_2025-04-29 in 1.28 sec.
2025-11-14 17:39:51,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2025-04-29' --> 'data\processed_data\T\10-Q_2025-04-29.md'


2025-11-14 17:39:52,124 - INFO - Going to convert document batch...
2025-11-14 17:39:52,125 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 17:39:53,166 - INFO - Finished converting document 10-Q_2025-07-24 in 2.03 sec.
2025-11-14 17:39:53,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2025-07-24' --> 'data\processed_data\T\10-Q_2025-07-24.md'


2025-11-14 17:39:54,739 - INFO - Going to convert document batch...
2025-11-14 17:39:54,739 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 17:39:55,753 - INFO - Finished converting document 10-Q_2025-10-31 in 1.95 sec.
2025-11-14 17:39:56,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:56,372 - INFO - Going to convert document batch...
2025-11-14 17:39:56,372 - INFO - Processing document 4_2023-01-04
2025-11-14 17:39:56,392 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 17:39:56,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:56,445 - INFO - Going to convert document batch...
2025-11-14 17:39:56,446 - INFO - Processing document 4_2023-01-18
2025-11-14 17:39:56,488 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:39:56,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\10-Q_2025-10-31' --> 'data\processed_data\T\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\T\4_2023-01-04' --> 'data\processed_data\T\4_2023-01-04.md'
Converted 'data\edgar_documents\T\4_2023-01-18' --> 'data\processed_data\T\4_2023-01-18.md'


2025-11-14 17:39:56,569 - INFO - Going to convert document batch...
2025-11-14 17:39:56,570 - INFO - Processing document 4_2023-01-30
2025-11-14 17:39:56,606 - INFO - Finished converting document 4_2023-01-30 in 0.08 sec.
2025-11-14 17:39:56,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:56,675 - INFO - Going to convert document batch...
2025-11-14 17:39:56,676 - INFO - Processing document 4_2023-02-02
2025-11-14 17:39:56,696 - INFO - Finished converting document 4_2023-02-02 in 0.03 sec.
2025-11-14 17:39:56,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:56,735 - INFO - Going to convert document batch...
2025-11-14 17:39:56,736 - INFO - Processing document 4_2023-02-16
2025-11-14 17:39:56,757 - INFO - Finished converting document 4_2023-02-16 in 0.03 sec.
2025-11-14 17:39:56,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:56,801 - INFO - Going to convert document batch...
2025-11-14 17:39:56,802 - 

Converted 'data\edgar_documents\T\4_2023-01-30' --> 'data\processed_data\T\4_2023-01-30.md'
Converted 'data\edgar_documents\T\4_2023-02-02' --> 'data\processed_data\T\4_2023-02-02.md'
Converted 'data\edgar_documents\T\4_2023-02-16' --> 'data\processed_data\T\4_2023-02-16.md'
Converted 'data\edgar_documents\T\4_2023-02-17' --> 'data\processed_data\T\4_2023-02-17.md'


2025-11-14 17:39:56,900 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:39:56,901 - ERROR - Input document 4_2023-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:39:56,902 - INFO - Going to convert document batch...
2025-11-14 17:39:56,925 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:39:56,926 - ERROR - Input document 4_2023-03-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\T\4_2023-02-21: File format not allowed: data\edgar_documents\T\4_2023-02-21
Error processing data\edgar_documents\T\4_2023-03-01: File format not allowed: data\edgar_documents\T\4_2023-03-01
Converted 'data\edgar_documents\T\4_2023-03-02' --> 'data\processed_data\T\4_2023-03-02.md'
Converted 'data\edgar_documents\T\4_2023-03-03' --> 'data\processed_data\T\4_2023-03-03.md'


2025-11-14 17:39:57,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,135 - INFO - Going to convert document batch...
2025-11-14 17:39:57,136 - INFO - Processing document 4_2023-04-04
2025-11-14 17:39:57,157 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 17:39:57,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,234 - INFO - Going to convert document batch...
2025-11-14 17:39:57,235 - INFO - Processing document 4_2023-04-25
2025-11-14 17:39:57,255 - INFO - Finished converting document 4_2023-04-25 in 0.05 sec.
2025-11-14 17:39:57,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\4_2023-03-14' --> 'data\processed_data\T\4_2023-03-14.md'
Converted 'data\edgar_documents\T\4_2023-04-04' --> 'data\processed_data\T\4_2023-04-04.md'
Converted 'data\edgar_documents\T\4_2023-04-25' --> 'data\processed_data\T\4_2023-04-25.md'


2025-11-14 17:39:57,302 - INFO - Going to convert document batch...
2025-11-14 17:39:57,303 - INFO - Processing document 4_2023-05-01
2025-11-14 17:39:57,325 - INFO - Finished converting document 4_2023-05-01 in 0.05 sec.
2025-11-14 17:39:57,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,373 - INFO - Going to convert document batch...
2025-11-14 17:39:57,374 - INFO - Processing document 4_2023-05-02
2025-11-14 17:39:57,392 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 17:39:57,436 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:39:57,437 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\T\4_2023-05-01' --> 'data\processed_data\T\4_2023-05-01.md'
Converted 'data\edgar_documents\T\4_2023-05-02' --> 'data\processed_data\T\4_2023-05-02.md'
Error processing data\edgar_documents\T\4_2023-05-15: File format not allowed: data\edgar_documents\T\4_2023-05-15
Converted 'data\edgar_documents\T\4_2023-05-22' --> 'data\processed_data\T\4_2023-05-22.md'


2025-11-14 17:39:57,548 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:39:57,549 - ERROR - Input document 4_2023-06-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:39:57,552 - INFO - Going to convert document batch...
2025-11-14 17:39:57,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,577 - INFO - Going to convert document batch...
2025-11-14 17:39:57,578 - INFO - Processing document 4_2023-06-02
2025-11-14 17:39:57,600 - INFO - Fin

Error processing data\edgar_documents\T\4_2023-06-01: File format not allowed: data\edgar_documents\T\4_2023-06-01
Converted 'data\edgar_documents\T\4_2023-06-02' --> 'data\processed_data\T\4_2023-06-02.md'
Converted 'data\edgar_documents\T\4_2023-06-20' --> 'data\processed_data\T\4_2023-06-20.md'


2025-11-14 17:39:57,743 - INFO - Processing document 4_2023-07-05
2025-11-14 17:39:57,765 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 17:39:57,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,813 - INFO - Going to convert document batch...
2025-11-14 17:39:57,814 - INFO - Processing document 4_2023-08-02
2025-11-14 17:39:57,834 - INFO - Finished converting document 4_2023-08-02 in 0.03 sec.
2025-11-14 17:39:57,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,878 - INFO - Going to convert document batch...
2025-11-14 17:39:57,879 - INFO - Processing document 4_2023-08-21
2025-11-14 17:39:57,899 - INFO - Finished converting document 4_2023-08-21 in 0.03 sec.
2025-11-14 17:39:57,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:57,941 - INFO - Going to convert document batch...
2025-11-14 17:39:57,942 - INFO - Processing document 4_2023-09-05
2025-11-14 17:39:57,963 - IN

Converted 'data\edgar_documents\T\4_2023-07-05' --> 'data\processed_data\T\4_2023-07-05.md'
Converted 'data\edgar_documents\T\4_2023-08-02' --> 'data\processed_data\T\4_2023-08-02.md'
Converted 'data\edgar_documents\T\4_2023-08-21' --> 'data\processed_data\T\4_2023-08-21.md'
Converted 'data\edgar_documents\T\4_2023-09-05' --> 'data\processed_data\T\4_2023-09-05.md'


2025-11-14 17:39:58,004 - INFO - Going to convert document batch...
2025-11-14 17:39:58,005 - INFO - Processing document 4_2023-10-02
2025-11-14 17:39:58,026 - INFO - Finished converting document 4_2023-10-02 in 0.05 sec.
2025-11-14 17:39:58,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,073 - INFO - Going to convert document batch...
2025-11-14 17:39:58,074 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\T\4_2023-10-02' --> 'data\processed_data\T\4_2023-10-02.md'


2025-11-14 17:39:58,523 - INFO - Finished converting document 4_2023-11-02 in 0.47 sec.
2025-11-14 17:39:58,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,576 - INFO - Going to convert document batch...
2025-11-14 17:39:58,576 - INFO - Processing document 4_2023-11-15
2025-11-14 17:39:58,595 - INFO - Finished converting document 4_2023-11-15 in 0.05 sec.
2025-11-14 17:39:58,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,636 - INFO - Going to convert document batch...
2025-11-14 17:39:58,636 - INFO - Processing document 4_2023-12-04
2025-11-14 17:39:58,659 - INFO - Finished converting document 4_2023-12-04 in 0.05 sec.
2025-11-14 17:39:58,696 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,705 - INFO - Going to convert document batch...
2025-11-14 17:39:58,706 - INFO - Processing document 4_2024-01-03
2025-11-14 17:39:58,724 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\T\4_2023-11-02' --> 'data\processed_data\T\4_2023-11-02.md'
Converted 'data\edgar_documents\T\4_2023-11-15' --> 'data\processed_data\T\4_2023-11-15.md'
Converted 'data\edgar_documents\T\4_2023-12-04' --> 'data\processed_data\T\4_2023-12-04.md'
Converted 'data\edgar_documents\T\4_2024-01-03' --> 'data\processed_data\T\4_2024-01-03.md'


2025-11-14 17:39:58,777 - INFO - Going to convert document batch...
2025-11-14 17:39:58,778 - INFO - Processing document 4_2024-01-17
2025-11-14 17:39:58,818 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 17:39:58,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,889 - INFO - Going to convert document batch...
2025-11-14 17:39:58,890 - INFO - Processing document 4_2024-01-29
2025-11-14 17:39:58,919 - INFO - Finished converting document 4_2024-01-29 in 0.08 sec.
2025-11-14 17:39:58,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:58,990 - INFO - Going to convert document batch...
2025-11-14 17:39:58,991 - INFO - Processing document 4_2024-02-02
2025-11-14 17:39:59,012 - INFO - Finished converting document 4_2024-02-02 in 0.08 sec.


Converted 'data\edgar_documents\T\4_2024-01-17' --> 'data\processed_data\T\4_2024-01-17.md'
Converted 'data\edgar_documents\T\4_2024-01-29' --> 'data\processed_data\T\4_2024-01-29.md'


2025-11-14 17:39:59,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,053 - INFO - Going to convert document batch...
2025-11-14 17:39:59,054 - INFO - Processing document 4_2024-02-20
2025-11-14 17:39:59,088 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 17:39:59,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,156 - INFO - Going to convert document batch...
2025-11-14 17:39:59,157 - INFO - Processing document 4_2024-02-21
2025-11-14 17:39:59,182 - INFO - Finished converting document 4_2024-02-21 in 0.06 sec.
2025-11-14 17:39:59,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\4_2024-02-02' --> 'data\processed_data\T\4_2024-02-02.md'
Converted 'data\edgar_documents\T\4_2024-02-20' --> 'data\processed_data\T\4_2024-02-20.md'
Converted 'data\edgar_documents\T\4_2024-02-21' --> 'data\processed_data\T\4_2024-02-21.md'


2025-11-14 17:39:59,234 - INFO - Going to convert document batch...
2025-11-14 17:39:59,235 - INFO - Processing document 4_2024-02-22
2025-11-14 17:39:59,262 - INFO - Finished converting document 4_2024-02-22 in 0.06 sec.
2025-11-14 17:39:59,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,312 - INFO - Going to convert document batch...
2025-11-14 17:39:59,313 - INFO - Processing document 4_2024-03-04
2025-11-14 17:39:59,342 - INFO - Finished converting document 4_2024-03-04 in 0.06 sec.
2025-11-14 17:39:59,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,418 - INFO - Going to convert document batch...
2025-11-14 17:39:59,418 - INFO - Processing document 4_2024-03-13
2025-11-14 17:39:59,441 - INFO - Finished converting document 4_2024-03-13 in 0.06 sec.


Converted 'data\edgar_documents\T\4_2024-02-22' --> 'data\processed_data\T\4_2024-02-22.md'
Converted 'data\edgar_documents\T\4_2024-03-04' --> 'data\processed_data\T\4_2024-03-04.md'
Converted 'data\edgar_documents\T\4_2024-03-13' --> 'data\processed_data\T\4_2024-03-13.md'


2025-11-14 17:39:59,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,500 - INFO - Going to convert document batch...
2025-11-14 17:39:59,501 - INFO - Processing document 4_2024-04-02
2025-11-14 17:39:59,524 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 17:39:59,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,570 - INFO - Going to convert document batch...
2025-11-14 17:39:59,571 - INFO - Processing document 4_2024-04-25
2025-11-14 17:39:59,595 - INFO - Finished converting document 4_2024-04-25 in 0.05 sec.
2025-11-14 17:39:59,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,643 - INFO - Going to convert document batch...
2025-11-14 17:39:59,644 - INFO - Processing document 4_2024-05-02
2025-11-14 17:39:59,669 - INFO - Finished converting document 4_2024-05-02 in 0.06 sec.
2025-11-14 17:39:59,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\T\4_2024-04-02' --> 'data\processed_data\T\4_2024-04-02.md'
Converted 'data\edgar_documents\T\4_2024-04-25' --> 'data\processed_data\T\4_2024-04-25.md'
Converted 'data\edgar_documents\T\4_2024-05-02' --> 'data\processed_data\T\4_2024-05-02.md'


2025-11-14 17:39:59,741 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 17:39:59,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,783 - INFO - Going to convert document batch...
2025-11-14 17:39:59,784 - INFO - Processing document 4_2024-06-17
2025-11-14 17:39:59,811 - INFO - Finished converting document 4_2024-06-17 in 0.05 sec.
2025-11-14 17:39:59,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,863 - INFO - Going to convert document batch...
2025-11-14 17:39:59,864 - INFO - Processing document 4_2024-07-01
2025-11-14 17:39:59,886 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 17:39:59,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,928 - INFO - Going to convert document batch...
2025-11-14 17:39:59,929 - INFO - Processing document 4_2024-07-02
2025-11-14 17:39:59,949 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.


Converted 'data\edgar_documents\T\4_2024-06-04' --> 'data\processed_data\T\4_2024-06-04.md'
Converted 'data\edgar_documents\T\4_2024-06-17' --> 'data\processed_data\T\4_2024-06-17.md'
Converted 'data\edgar_documents\T\4_2024-07-01' --> 'data\processed_data\T\4_2024-07-01.md'


2025-11-14 17:39:59,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:39:59,990 - INFO - Going to convert document batch...
2025-11-14 17:39:59,991 - INFO - Processing document 4_2024-07-30
2025-11-14 17:40:00,015 - INFO - Finished converting document 4_2024-07-30 in 0.05 sec.
2025-11-14 17:40:00,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,060 - INFO - Going to convert document batch...
2025-11-14 17:40:00,061 - INFO - Processing document 4_2024-08-02
2025-11-14 17:40:00,081 - INFO - Finished converting document 4_2024-08-02 in 0.03 sec.
2025-11-14 17:40:00,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,126 - INFO - Going to convert document batch...
2025-11-14 17:40:00,127 - INFO - Processing document 4_2024-08-06
2025-11-14 17:40:00,149 - INFO - Finished converting document 4_2024-08-06 in 0.03 sec.
2025-11-14 17:40:00,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\4_2024-07-02' --> 'data\processed_data\T\4_2024-07-02.md'
Converted 'data\edgar_documents\T\4_2024-07-30' --> 'data\processed_data\T\4_2024-07-30.md'
Converted 'data\edgar_documents\T\4_2024-08-02' --> 'data\processed_data\T\4_2024-08-02.md'
Converted 'data\edgar_documents\T\4_2024-08-06' --> 'data\processed_data\T\4_2024-08-06.md'


2025-11-14 17:40:00,198 - INFO - Going to convert document batch...
2025-11-14 17:40:00,199 - INFO - Processing document 4_2024-08-12
2025-11-14 17:40:00,231 - INFO - Finished converting document 4_2024-08-12 in 0.06 sec.
2025-11-14 17:40:00,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,278 - INFO - Going to convert document batch...
2025-11-14 17:40:00,278 - INFO - Processing document 4_2024-09-04
2025-11-14 17:40:00,303 - INFO - Finished converting document 4_2024-09-04 in 0.05 sec.
2025-11-14 17:40:00,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,347 - INFO - Going to convert document batch...
2025-11-14 17:40:00,348 - INFO - Processing document 4_2024-09-17
2025-11-14 17:40:00,373 - INFO - Finished converting document 4_2024-09-17 in 0.05 sec.
2025-11-14 17:40:00,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,430 - INFO - Going to convert document batch...
2025-11-14 17:40:00,431 - 

Converted 'data\edgar_documents\T\4_2024-08-12' --> 'data\processed_data\T\4_2024-08-12.md'
Converted 'data\edgar_documents\T\4_2024-09-04' --> 'data\processed_data\T\4_2024-09-04.md'
Converted 'data\edgar_documents\T\4_2024-09-17' --> 'data\processed_data\T\4_2024-09-17.md'


2025-11-14 17:40:00,452 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 17:40:00,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,500 - INFO - Going to convert document batch...
2025-11-14 17:40:00,501 - INFO - Processing document 4_2024-10-15
2025-11-14 17:40:00,525 - INFO - Finished converting document 4_2024-10-15 in 0.05 sec.
2025-11-14 17:40:00,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,570 - INFO - Going to convert document batch...
2025-11-14 17:40:00,571 - INFO - Processing document 4_2024-11-04
2025-11-14 17:40:00,610 - INFO - Finished converting document 4_2024-11-04 in 0.06 sec.
2025-11-14 17:40:00,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,658 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\T\4_2024-10-02' --> 'data\processed_data\T\4_2024-10-02.md'
Converted 'data\edgar_documents\T\4_2024-10-15' --> 'data\processed_data\T\4_2024-10-15.md'
Converted 'data\edgar_documents\T\4_2024-11-04' --> 'data\processed_data\T\4_2024-11-04.md'


2025-11-14 17:40:00,658 - INFO - Processing document 4_2024-12-03
2025-11-14 17:40:00,684 - INFO - Finished converting document 4_2024-12-03 in 0.05 sec.
2025-11-14 17:40:00,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,734 - INFO - Going to convert document batch...
2025-11-14 17:40:00,734 - INFO - Processing document 4_2024-12-17
2025-11-14 17:40:00,756 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 17:40:00,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,801 - INFO - Going to convert document batch...
2025-11-14 17:40:00,801 - INFO - Processing document 4_2025-01-03
2025-11-14 17:40:00,821 - INFO - Finished converting document 4_2025-01-03 in 0.03 sec.
2025-11-14 17:40:00,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,867 - INFO - Going to convert document batch...
2025-11-14 17:40:00,868 - INFO - Processing document 4_2025-01-17
2025-11-14 17:40:00,900 - IN

Converted 'data\edgar_documents\T\4_2024-12-03' --> 'data\processed_data\T\4_2024-12-03.md'
Converted 'data\edgar_documents\T\4_2024-12-17' --> 'data\processed_data\T\4_2024-12-17.md'
Converted 'data\edgar_documents\T\4_2025-01-03' --> 'data\processed_data\T\4_2025-01-03.md'


2025-11-14 17:40:00,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:00,951 - INFO - Going to convert document batch...
2025-11-14 17:40:00,951 - INFO - Processing document 4_2025-01-21
2025-11-14 17:40:00,976 - INFO - Finished converting document 4_2025-01-21 in 0.05 sec.
2025-11-14 17:40:01,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,020 - INFO - Going to convert document batch...
2025-11-14 17:40:01,021 - INFO - Processing document 4_2025-01-22
2025-11-14 17:40:01,044 - INFO - Finished converting document 4_2025-01-22 in 0.05 sec.
2025-11-14 17:40:01,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,093 - INFO - Going to convert document batch...
2025-11-14 17:40:01,094 - INFO - Processing document 4_2025-01-27


Converted 'data\edgar_documents\T\4_2025-01-17' --> 'data\processed_data\T\4_2025-01-17.md'
Converted 'data\edgar_documents\T\4_2025-01-21' --> 'data\processed_data\T\4_2025-01-21.md'
Converted 'data\edgar_documents\T\4_2025-01-22' --> 'data\processed_data\T\4_2025-01-22.md'


2025-11-14 17:40:01,125 - INFO - Finished converting document 4_2025-01-27 in 0.06 sec.
2025-11-14 17:40:01,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,187 - INFO - Going to convert document batch...
2025-11-14 17:40:01,188 - INFO - Processing document 4_2025-02-03
2025-11-14 17:40:01,212 - INFO - Finished converting document 4_2025-02-03 in 0.05 sec.
2025-11-14 17:40:01,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,254 - INFO - Going to convert document batch...
2025-11-14 17:40:01,256 - INFO - Processing document 4_2025-02-04
2025-11-14 17:40:01,277 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 17:40:01,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,316 - INFO - Going to convert document batch...
2025-11-14 17:40:01,317 - INFO - Processing document 4_2025-02-20
2025-11-14 17:40:01,336 - INFO - Finished converting document 4_2025-02-20 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\T\4_2025-01-27' --> 'data\processed_data\T\4_2025-01-27.md'
Converted 'data\edgar_documents\T\4_2025-02-03' --> 'data\processed_data\T\4_2025-02-03.md'
Converted 'data\edgar_documents\T\4_2025-02-04' --> 'data\processed_data\T\4_2025-02-04.md'
Converted 'data\edgar_documents\T\4_2025-02-20' --> 'data\processed_data\T\4_2025-02-20.md'


2025-11-14 17:40:01,376 - INFO - Going to convert document batch...
2025-11-14 17:40:01,377 - INFO - Processing document 4_2025-02-21
2025-11-14 17:40:01,399 - INFO - Finished converting document 4_2025-02-21 in 0.03 sec.
2025-11-14 17:40:01,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,443 - INFO - Going to convert document batch...
2025-11-14 17:40:01,444 - INFO - Processing document 4_2025-02-26
2025-11-14 17:40:01,471 - INFO - Finished converting document 4_2025-02-26 in 0.05 sec.
2025-11-14 17:40:01,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,514 - INFO - Going to convert document batch...
2025-11-14 17:40:01,515 - INFO - Processing document 4_2025-02-27
2025-11-14 17:40:01,541 - INFO - Finished converting document 4_2025-02-27 in 0.03 sec.
2025-11-14 17:40:01,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,581 - INFO - Going to convert document batch...
2025-11-14 17:40:01,582 - 

Converted 'data\edgar_documents\T\4_2025-02-21' --> 'data\processed_data\T\4_2025-02-21.md'
Converted 'data\edgar_documents\T\4_2025-02-26' --> 'data\processed_data\T\4_2025-02-26.md'
Converted 'data\edgar_documents\T\4_2025-02-27' --> 'data\processed_data\T\4_2025-02-27.md'


2025-11-14 17:40:01,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,643 - INFO - Going to convert document batch...
2025-11-14 17:40:01,644 - INFO - Processing document 4_2025-03-11
2025-11-14 17:40:01,666 - INFO - Finished converting document 4_2025-03-11 in 0.03 sec.
2025-11-14 17:40:01,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,709 - INFO - Going to convert document batch...
2025-11-14 17:40:01,710 - INFO - Processing document 4_2025-03-18
2025-11-14 17:40:01,731 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 17:40:01,797 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:01,798 - ERROR - Input document 4_2025-03-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\T\4_2025-03-04' --> 'data\processed_data\T\4_2025-03-04.md'
Converted 'data\edgar_documents\T\4_2025-03-11' --> 'data\processed_data\T\4_2025-03-11.md'
Converted 'data\edgar_documents\T\4_2025-03-18' --> 'data\processed_data\T\4_2025-03-18.md'
Error processing data\edgar_documents\T\4_2025-03-26: File format not allowed: data\edgar_documents\T\4_2025-03-26


2025-11-14 17:40:01,827 - INFO - Going to convert document batch...
2025-11-14 17:40:01,828 - INFO - Processing document 4_2025-04-02
2025-11-14 17:40:01,847 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 17:40:01,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,890 - INFO - Going to convert document batch...
2025-11-14 17:40:01,892 - INFO - Processing document 4_2025-05-02
2025-11-14 17:40:01,935 - INFO - Finished converting document 4_2025-05-02 in 0.06 sec.
2025-11-14 17:40:01,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:01,984 - INFO - Going to convert document batch...
2025-11-14 17:40:01,984 - INFO - Processing document 4_2025-05-14
2025-11-14 17:40:02,003 - INFO - Finished converting document 4_2025-05-14 in 0.05 sec.
2025-11-14 17:40:02,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:02,044 - INFO - Going to convert document batch...
2025-11-14 17:40:02,045 - 

Converted 'data\edgar_documents\T\4_2025-04-02' --> 'data\processed_data\T\4_2025-04-02.md'
Converted 'data\edgar_documents\T\4_2025-05-02' --> 'data\processed_data\T\4_2025-05-02.md'
Converted 'data\edgar_documents\T\4_2025-05-14' --> 'data\processed_data\T\4_2025-05-14.md'


2025-11-14 17:40:02,106 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:02,107 - ERROR - Input document 4_2025-05-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40:02,108 - INFO - Going to convert document batch...
2025-11-14 17:40:02,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:02,131 - INFO - Going to convert document batch...
2025-11-14 17:40:02,132 - INFO - Processing document 4_2025-06-03
2025-11-14 17:40:02,152 - INFO - Fin

Converted 'data\edgar_documents\T\4_2025-05-19' --> 'data\processed_data\T\4_2025-05-19.md'
Error processing data\edgar_documents\T\4_2025-05-30: File format not allowed: data\edgar_documents\T\4_2025-05-30
Converted 'data\edgar_documents\T\4_2025-06-03' --> 'data\processed_data\T\4_2025-06-03.md'
Converted 'data\edgar_documents\T\4_2025-07-02' --> 'data\processed_data\T\4_2025-07-02.md'


2025-11-14 17:40:02,287 - INFO - Going to convert document batch...
2025-11-14 17:40:02,288 - INFO - Processing document 4_2025-07-30
2025-11-14 17:40:02,563 - INFO - Finished converting document 4_2025-07-30 in 0.33 sec.
2025-11-14 17:40:02,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:02,606 - INFO - Going to convert document batch...
2025-11-14 17:40:02,607 - INFO - Processing document 4_2025-08-04
2025-11-14 17:40:02,626 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.
2025-11-14 17:40:02,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:02,665 - INFO - Going to convert document batch...
2025-11-14 17:40:02,666 - INFO - Processing document 4_2025-09-03
2025-11-14 17:40:02,688 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:40:02,749 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:02,750 - ERROR - Input document 4_2025-09-11 with format None does 

Converted 'data\edgar_documents\T\4_2025-07-30' --> 'data\processed_data\T\4_2025-07-30.md'
Converted 'data\edgar_documents\T\4_2025-08-04' --> 'data\processed_data\T\4_2025-08-04.md'
Converted 'data\edgar_documents\T\4_2025-09-03' --> 'data\processed_data\T\4_2025-09-03.md'
Error processing data\edgar_documents\T\4_2025-09-11: File format not allowed: data\edgar_documents\T\4_2025-09-11


2025-11-14 17:40:02,770 - ERROR - Input document 4_2025-09-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40:02,771 - INFO - Going to convert document batch...
2025-11-14 17:40:02,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:02,793 - INFO - Going to convert document batch...
2025-11-14 17:40:02,794 - INFO - Processing document 4_2025-09-25
2025-11-14 17:40:02,813 - INFO - Finished converting document 4_2025-09-25 in 0.05 sec.
2025-11-14 17:40:02,848 - INFO - detec

Error processing data\edgar_documents\T\4_2025-09-19: File format not allowed: data\edgar_documents\T\4_2025-09-19
Converted 'data\edgar_documents\T\4_2025-09-25' --> 'data\processed_data\T\4_2025-09-25.md'
Converted 'data\edgar_documents\T\4_2025-10-02' --> 'data\processed_data\T\4_2025-10-02.md'
Converted 'data\edgar_documents\T\4_2025-10-16' --> 'data\processed_data\T\4_2025-10-16.md'


2025-11-14 17:40:02,980 - INFO - Going to convert document batch...
2025-11-14 17:40:02,980 - INFO - Processing document 4_2025-10-23
2025-11-14 17:40:03,001 - INFO - Finished converting document 4_2025-10-23 in 0.05 sec.
2025-11-14 17:40:03,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,059 - INFO - Going to convert document batch...
2025-11-14 17:40:03,060 - INFO - Processing document 4_2025-10-28
2025-11-14 17:40:03,087 - INFO - Finished converting document 4_2025-10-28 in 0.06 sec.
2025-11-14 17:40:03,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,136 - INFO - Going to convert document batch...
2025-11-14 17:40:03,137 - INFO - Processing document 4_2025-11-04
2025-11-14 17:40:03,164 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 17:40:03,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\4_2025-10-23' --> 'data\processed_data\T\4_2025-10-23.md'
Converted 'data\edgar_documents\T\4_2025-10-28' --> 'data\processed_data\T\4_2025-10-28.md'
Converted 'data\edgar_documents\T\4_2025-11-04' --> 'data\processed_data\T\4_2025-11-04.md'


2025-11-14 17:40:03,231 - INFO - Going to convert document batch...
2025-11-14 17:40:03,231 - INFO - Processing document 8-K_2023-01-25
2025-11-14 17:40:03,277 - INFO - Finished converting document 8-K_2023-01-25 in 0.09 sec.
2025-11-14 17:40:03,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,345 - INFO - Going to convert document batch...
2025-11-14 17:40:03,346 - INFO - Processing document 8-K_2023-02-02
2025-11-14 17:40:03,382 - INFO - Finished converting document 8-K_2023-02-02 in 0.08 sec.
2025-11-14 17:40:03,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,465 - INFO - Going to convert document batch...
2025-11-14 17:40:03,466 - INFO - Processing document 8-K_2023-02-22


Converted 'data\edgar_documents\T\8-K_2023-01-25' --> 'data\processed_data\T\8-K_2023-01-25.md'
Converted 'data\edgar_documents\T\8-K_2023-02-02' --> 'data\processed_data\T\8-K_2023-02-02.md'


2025-11-14 17:40:03,501 - INFO - Finished converting document 8-K_2023-02-22 in 0.11 sec.
2025-11-14 17:40:03,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,562 - INFO - Going to convert document batch...
2025-11-14 17:40:03,563 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:40:03,601 - INFO - Finished converting document 8-K_2023-03-03 in 0.08 sec.
2025-11-14 17:40:03,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,686 - INFO - Going to convert document batch...
2025-11-14 17:40:03,687 - INFO - Processing document 8-K_2023-03-06
2025-11-14 17:40:03,723 - INFO - Finished converting document 8-K_2023-03-06 in 0.09 sec.


Converted 'data\edgar_documents\T\8-K_2023-02-22' --> 'data\processed_data\T\8-K_2023-02-22.md'
Converted 'data\edgar_documents\T\8-K_2023-03-03' --> 'data\processed_data\T\8-K_2023-03-03.md'


2025-11-14 17:40:03,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,790 - INFO - Going to convert document batch...
2025-11-14 17:40:03,792 - INFO - Processing document 8-K_2023-04-07
2025-11-14 17:40:03,851 - INFO - Finished converting document 8-K_2023-04-07 in 0.11 sec.
2025-11-14 17:40:03,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:03,915 - INFO - Going to convert document batch...
2025-11-14 17:40:03,916 - INFO - Processing document 8-K_2023-04-20


Converted 'data\edgar_documents\T\8-K_2023-03-06' --> 'data\processed_data\T\8-K_2023-03-06.md'
Converted 'data\edgar_documents\T\8-K_2023-04-07' --> 'data\processed_data\T\8-K_2023-04-07.md'


2025-11-14 17:40:03,954 - INFO - Finished converting document 8-K_2023-04-20 in 0.09 sec.
2025-11-14 17:40:03,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,023 - INFO - Going to convert document batch...
2025-11-14 17:40:04,024 - INFO - Processing document 8-K_2023-05-01
2025-11-14 17:40:04,060 - INFO - Finished converting document 8-K_2023-05-01 in 0.09 sec.
2025-11-14 17:40:04,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,121 - INFO - Going to convert document batch...
2025-11-14 17:40:04,122 - INFO - Processing document 8-K_2023-05-03
2025-11-14 17:40:04,157 - INFO - Finished converting document 8-K_2023-05-03 in 0.08 sec.


Converted 'data\edgar_documents\T\8-K_2023-04-20' --> 'data\processed_data\T\8-K_2023-04-20.md'
Converted 'data\edgar_documents\T\8-K_2023-05-01' --> 'data\processed_data\T\8-K_2023-05-01.md'


2025-11-14 17:40:04,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,221 - INFO - Going to convert document batch...
2025-11-14 17:40:04,222 - INFO - Processing document 8-K_2023-05-18
2025-11-14 17:40:04,259 - INFO - Finished converting document 8-K_2023-05-18 in 0.08 sec.
2025-11-14 17:40:04,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,356 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\T\8-K_2023-05-03' --> 'data\processed_data\T\8-K_2023-05-03.md'
Converted 'data\edgar_documents\T\8-K_2023-05-18' --> 'data\processed_data\T\8-K_2023-05-18.md'


2025-11-14 17:40:04,357 - INFO - Processing document 8-K_2023-05-23
2025-11-14 17:40:04,423 - INFO - Finished converting document 8-K_2023-05-23 in 0.16 sec.
2025-11-14 17:40:04,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,496 - INFO - Going to convert document batch...
2025-11-14 17:40:04,497 - INFO - Processing document 8-K_2023-06-02
2025-11-14 17:40:04,538 - INFO - Finished converting document 8-K_2023-06-02 in 0.08 sec.
2025-11-14 17:40:04,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,594 - INFO - Going to convert document batch...
2025-11-14 17:40:04,596 - INFO - Processing document 8-K_2023-07-26
2025-11-14 17:40:04,635 - INFO - Finished converting document 8-K_2023-07-26 in 0.09 sec.


Converted 'data\edgar_documents\T\8-K_2023-05-23' --> 'data\processed_data\T\8-K_2023-05-23.md'
Converted 'data\edgar_documents\T\8-K_2023-06-02' --> 'data\processed_data\T\8-K_2023-06-02.md'


2025-11-14 17:40:04,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,703 - INFO - Going to convert document batch...
2025-11-14 17:40:04,704 - INFO - Processing document 8-K_2023-10-19
2025-11-14 17:40:04,745 - INFO - Finished converting document 8-K_2023-10-19 in 0.09 sec.
2025-11-14 17:40:04,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,822 - INFO - Going to convert document batch...
2025-11-14 17:40:04,823 - INFO - Processing document 8-K_2024-01-24


Converted 'data\edgar_documents\T\8-K_2023-07-26' --> 'data\processed_data\T\8-K_2023-07-26.md'
Converted 'data\edgar_documents\T\8-K_2023-10-19' --> 'data\processed_data\T\8-K_2023-10-19.md'


2025-11-14 17:40:04,863 - INFO - Finished converting document 8-K_2024-01-24 in 0.09 sec.
2025-11-14 17:40:04,900 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:04,925 - INFO - Going to convert document batch...
2025-11-14 17:40:04,926 - INFO - Processing document 8-K_2024-03-01
2025-11-14 17:40:04,962 - INFO - Finished converting document 8-K_2024-03-01 in 0.06 sec.
2025-11-14 17:40:05,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,040 - INFO - Going to convert document batch...
2025-11-14 17:40:05,041 - INFO - Processing document 8-K_2024-04-24
2025-11-14 17:40:05,079 - INFO - Finished converting document 8-K_2024-04-24 in 0.09 sec.


Converted 'data\edgar_documents\T\8-K_2024-01-24' --> 'data\processed_data\T\8-K_2024-01-24.md'
Converted 'data\edgar_documents\T\8-K_2024-03-01' --> 'data\processed_data\T\8-K_2024-03-01.md'


2025-11-14 17:40:05,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\8-K_2024-04-24' --> 'data\processed_data\T\8-K_2024-04-24.md'


2025-11-14 17:40:05,385 - INFO - Going to convert document batch...
2025-11-14 17:40:05,386 - INFO - Processing document 8-K_2024-05-21
2025-11-14 17:40:05,448 - INFO - Finished converting document 8-K_2024-05-21 in 0.36 sec.
2025-11-14 17:40:05,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,533 - INFO - Going to convert document batch...
2025-11-14 17:40:05,533 - INFO - Processing document 8-K_2024-07-12
2025-11-14 17:40:05,567 - INFO - Finished converting document 8-K_2024-07-12 in 0.09 sec.
2025-11-14 17:40:05,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,620 - INFO - Going to convert document batch...
2025-11-14 17:40:05,621 - INFO - Processing document 8-K_2024-07-24
2025-11-14 17:40:05,655 - INFO - Finished converting document 8-K_2024-07-24 in 0.08 sec.


Converted 'data\edgar_documents\T\8-K_2024-05-21' --> 'data\processed_data\T\8-K_2024-05-21.md'
Converted 'data\edgar_documents\T\8-K_2024-07-12' --> 'data\processed_data\T\8-K_2024-07-12.md'


2025-11-14 17:40:05,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,719 - INFO - Going to convert document batch...
2025-11-14 17:40:05,720 - INFO - Processing document 8-K_2024-09-30
2025-11-14 17:40:05,760 - INFO - Finished converting document 8-K_2024-09-30 in 0.09 sec.
2025-11-14 17:40:05,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,816 - INFO - Going to convert document batch...
2025-11-14 17:40:05,817 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:40:05,857 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.


Converted 'data\edgar_documents\T\8-K_2024-07-24' --> 'data\processed_data\T\8-K_2024-07-24.md'
Converted 'data\edgar_documents\T\8-K_2024-09-30' --> 'data\processed_data\T\8-K_2024-09-30.md'


2025-11-14 17:40:05,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:05,914 - INFO - Going to convert document batch...
2025-11-14 17:40:05,915 - INFO - Processing document 8-K_2024-12-03
2025-11-14 17:40:05,954 - INFO - Finished converting document 8-K_2024-12-03 in 0.08 sec.
2025-11-14 17:40:06,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,036 - INFO - Going to convert document batch...
2025-11-14 17:40:06,037 - INFO - Processing document 8-K_2025-01-27
2025-11-14 17:40:06,073 - INFO - Finished converting document 8-K_2025-01-27 in 0.11 sec.


Converted 'data\edgar_documents\T\8-K_2024-10-23' --> 'data\processed_data\T\8-K_2024-10-23.md'
Converted 'data\edgar_documents\T\8-K_2024-12-03' --> 'data\processed_data\T\8-K_2024-12-03.md'


2025-11-14 17:40:06,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,147 - INFO - Going to convert document batch...
2025-11-14 17:40:06,149 - INFO - Processing document 8-K_2025-02-05
2025-11-14 17:40:06,191 - INFO - Finished converting document 8-K_2025-02-05 in 0.09 sec.
2025-11-14 17:40:06,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,256 - INFO - Going to convert document batch...
2025-11-14 17:40:06,257 - INFO - Processing document 8-K_2025-03-31


Converted 'data\edgar_documents\T\8-K_2025-01-27' --> 'data\processed_data\T\8-K_2025-01-27.md'
Converted 'data\edgar_documents\T\8-K_2025-02-05' --> 'data\processed_data\T\8-K_2025-02-05.md'


2025-11-14 17:40:06,296 - INFO - Finished converting document 8-K_2025-03-31 in 0.09 sec.
2025-11-14 17:40:06,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,352 - INFO - Going to convert document batch...
2025-11-14 17:40:06,353 - INFO - Processing document 8-K_2025-04-23
2025-11-14 17:40:06,390 - INFO - Finished converting document 8-K_2025-04-23 in 0.08 sec.
2025-11-14 17:40:06,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,468 - INFO - Going to convert document batch...
2025-11-14 17:40:06,468 - INFO - Processing document 8-K_2025-05-19
2025-11-14 17:40:06,524 - INFO - Finished converting document 8-K_2025-05-19 in 0.11 sec.


Converted 'data\edgar_documents\T\8-K_2025-03-31' --> 'data\processed_data\T\8-K_2025-03-31.md'
Converted 'data\edgar_documents\T\8-K_2025-04-23' --> 'data\processed_data\T\8-K_2025-04-23.md'


2025-11-14 17:40:06,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,590 - INFO - Going to convert document batch...
2025-11-14 17:40:06,591 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:40:06,636 - INFO - Finished converting document 8-K_2025-05-21 in 0.09 sec.
2025-11-14 17:40:06,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,715 - INFO - Going to convert document batch...
2025-11-14 17:40:06,715 - INFO - Processing document 8-K_2025-06-03


Converted 'data\edgar_documents\T\8-K_2025-05-19' --> 'data\processed_data\T\8-K_2025-05-19.md'
Converted 'data\edgar_documents\T\8-K_2025-05-21' --> 'data\processed_data\T\8-K_2025-05-21.md'


2025-11-14 17:40:06,751 - INFO - Finished converting document 8-K_2025-06-03 in 0.09 sec.
2025-11-14 17:40:06,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,807 - INFO - Going to convert document batch...
2025-11-14 17:40:06,808 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:40:06,848 - INFO - Finished converting document 8-K_2025-07-23 in 0.08 sec.
2025-11-14 17:40:06,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,911 - INFO - Going to convert document batch...
2025-11-14 17:40:06,912 - INFO - Processing document 8-K_2025-08-19
2025-11-14 17:40:06,943 - INFO - Finished converting document 8-K_2025-08-19 in 0.06 sec.


Converted 'data\edgar_documents\T\8-K_2025-06-03' --> 'data\processed_data\T\8-K_2025-06-03.md'
Converted 'data\edgar_documents\T\8-K_2025-07-23' --> 'data\processed_data\T\8-K_2025-07-23.md'


2025-11-14 17:40:06,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:06,999 - INFO - Going to convert document batch...
2025-11-14 17:40:07,000 - INFO - Processing document 8-K_2025-08-26
2025-11-14 17:40:07,064 - INFO - Finished converting document 8-K_2025-08-26 in 0.11 sec.
2025-11-14 17:40:07,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:07,129 - INFO - Going to convert document batch...
2025-11-14 17:40:07,130 - INFO - Processing document 8-K_2025-09-16


Converted 'data\edgar_documents\T\8-K_2025-08-19' --> 'data\processed_data\T\8-K_2025-08-19.md'
Converted 'data\edgar_documents\T\8-K_2025-08-26' --> 'data\processed_data\T\8-K_2025-08-26.md'


2025-11-14 17:40:07,164 - INFO - Finished converting document 8-K_2025-09-16 in 0.08 sec.
2025-11-14 17:40:07,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:07,228 - INFO - Going to convert document batch...
2025-11-14 17:40:07,229 - INFO - Processing document 8-K_2025-09-24
2025-11-14 17:40:07,272 - INFO - Finished converting document 8-K_2025-09-24 in 0.09 sec.
2025-11-14 17:40:07,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:07,324 - INFO - Going to convert document batch...
2025-11-14 17:40:07,325 - INFO - Processing document 8-K_2025-10-22
2025-11-14 17:40:07,362 - INFO - Finished converting document 8-K_2025-10-22 in 0.08 sec.


Converted 'data\edgar_documents\T\8-K_2025-09-16' --> 'data\processed_data\T\8-K_2025-09-16.md'
Converted 'data\edgar_documents\T\8-K_2025-09-24' --> 'data\processed_data\T\8-K_2025-09-24.md'


2025-11-14 17:40:07,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:07,439 - INFO - Going to convert document batch...
2025-11-14 17:40:07,440 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:40:07,519 - INFO - Finished converting document 8-K_2025-11-03 in 0.12 sec.


Converted 'data\edgar_documents\T\8-K_2025-10-22' --> 'data\processed_data\T\8-K_2025-10-22.md'
Converted 'data\edgar_documents\T\8-K_2025-11-03' --> 'data\processed_data\T\8-K_2025-11-03.md'


2025-11-14 17:40:07,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:08,557 - INFO - Going to convert document batch...
2025-11-14 17:40:08,560 - INFO - Processing document DEF-14A_2023-04-03
2025-11-14 17:40:10,071 - INFO - Finished converting document DEF-14A_2023-04-03 in 2.52 sec.
2025-11-14 17:40:10,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\DEF-14A_2023-04-03' --> 'data\processed_data\T\DEF-14A_2023-04-03.md'


2025-11-14 17:40:11,699 - INFO - Going to convert document batch...
2025-11-14 17:40:11,700 - INFO - Processing document DEF-14A_2024-04-04
2025-11-14 17:40:12,902 - INFO - Finished converting document DEF-14A_2024-04-04 in 2.19 sec.
2025-11-14 17:40:13,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\DEF-14A_2024-04-04' --> 'data\processed_data\T\DEF-14A_2024-04-04.md'


2025-11-14 17:40:14,305 - INFO - Going to convert document batch...
2025-11-14 17:40:14,306 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 17:40:16,056 - INFO - Finished converting document DEF-14A_2025-04-04 in 2.47 sec.
2025-11-14 17:40:16,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\T\DEF-14A_2025-04-04' --> 'data\processed_data\T\DEF-14A_2025-04-04.md'
Processed 132 new files. Errors: 8
Found 85 files to process in data\edgar_documents\TGT


2025-11-14 17:40:17,174 - INFO - Going to convert document batch...
2025-11-14 17:40:17,175 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:40:17,175 - INFO - Processing document 10-K_2023-03-08
2025-11-14 17:40:19,105 - INFO - Finished converting document 10-K_2023-03-08 in 2.42 sec.
2025-11-14 17:40:19,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-K_2023-03-08' --> 'data\processed_data\TGT\10-K_2023-03-08.md'


2025-11-14 17:40:20,569 - INFO - Going to convert document batch...
2025-11-14 17:40:20,570 - INFO - Processing document 10-K_2024-03-13
2025-11-14 17:40:22,599 - INFO - Finished converting document 10-K_2024-03-13 in 2.97 sec.
2025-11-14 17:40:23,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-K_2024-03-13' --> 'data\processed_data\TGT\10-K_2024-03-13.md'


2025-11-14 17:40:23,917 - INFO - Going to convert document batch...
2025-11-14 17:40:23,918 - INFO - Processing document 10-K_2025-03-12
2025-11-14 17:40:26,058 - INFO - Finished converting document 10-K_2025-03-12 in 2.94 sec.
2025-11-14 17:40:26,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-K_2025-03-12' --> 'data\processed_data\TGT\10-K_2025-03-12.md'


2025-11-14 17:40:26,912 - INFO - Going to convert document batch...
2025-11-14 17:40:26,912 - INFO - Processing document 10-Q_2023-05-26
2025-11-14 17:40:27,514 - INFO - Finished converting document 10-Q_2023-05-26 in 0.86 sec.
2025-11-14 17:40:27,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2023-05-26' --> 'data\processed_data\TGT\10-Q_2023-05-26.md'


2025-11-14 17:40:28,077 - INFO - Going to convert document batch...
2025-11-14 17:40:28,078 - INFO - Processing document 10-Q_2023-08-25
2025-11-14 17:40:29,057 - INFO - Finished converting document 10-Q_2023-08-25 in 1.27 sec.
2025-11-14 17:40:29,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2023-08-25' --> 'data\processed_data\TGT\10-Q_2023-08-25.md'


2025-11-14 17:40:29,655 - INFO - Going to convert document batch...
2025-11-14 17:40:29,656 - INFO - Processing document 10-Q_2023-11-22
2025-11-14 17:40:30,255 - INFO - Finished converting document 10-Q_2023-11-22 in 0.89 sec.
2025-11-14 17:40:30,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2023-11-22' --> 'data\processed_data\TGT\10-Q_2023-11-22.md'


2025-11-14 17:40:30,796 - INFO - Going to convert document batch...
2025-11-14 17:40:30,797 - INFO - Processing document 10-Q_2024-05-31
2025-11-14 17:40:31,309 - INFO - Finished converting document 10-Q_2024-05-31 in 0.75 sec.
2025-11-14 17:40:31,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2024-05-31' --> 'data\processed_data\TGT\10-Q_2024-05-31.md'


2025-11-14 17:40:32,198 - INFO - Going to convert document batch...
2025-11-14 17:40:32,200 - INFO - Processing document 10-Q_2024-08-30
2025-11-14 17:40:32,774 - INFO - Finished converting document 10-Q_2024-08-30 in 1.19 sec.
2025-11-14 17:40:33,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2024-08-30' --> 'data\processed_data\TGT\10-Q_2024-08-30.md'


2025-11-14 17:40:33,340 - INFO - Going to convert document batch...
2025-11-14 17:40:33,341 - INFO - Processing document 10-Q_2024-11-27
2025-11-14 17:40:33,937 - INFO - Finished converting document 10-Q_2024-11-27 in 0.88 sec.
2025-11-14 17:40:34,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2024-11-27' --> 'data\processed_data\TGT\10-Q_2024-11-27.md'


2025-11-14 17:40:34,742 - INFO - Going to convert document batch...
2025-11-14 17:40:34,743 - INFO - Processing document 10-Q_2025-05-30
2025-11-14 17:40:35,288 - INFO - Finished converting document 10-Q_2025-05-30 in 1.05 sec.
2025-11-14 17:40:35,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\10-Q_2025-05-30' --> 'data\processed_data\TGT\10-Q_2025-05-30.md'


2025-11-14 17:40:35,868 - INFO - Going to convert document batch...
2025-11-14 17:40:35,869 - INFO - Processing document 10-Q_2025-08-29
2025-11-14 17:40:36,543 - INFO - Finished converting document 10-Q_2025-08-29 in 0.97 sec.
2025-11-14 17:40:36,919 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:36,921 - ERROR - Input document 4_2023-01-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40:36,922 - INFO - Going to convert document batch...
2025-11-14 17:40:36,95

Converted 'data\edgar_documents\TGT\10-Q_2025-08-29' --> 'data\processed_data\TGT\10-Q_2025-08-29.md'
Error processing data\edgar_documents\TGT\4_2023-01-17: File format not allowed: data\edgar_documents\TGT\4_2023-01-17
Error processing data\edgar_documents\TGT\4_2023-01-18: File format not allowed: data\edgar_documents\TGT\4_2023-01-18
Converted 'data\edgar_documents\TGT\4_2023-03-10' --> 'data\processed_data\TGT\4_2023-03-10.md'


2025-11-14 17:40:37,059 - INFO - Going to convert document batch...
2025-11-14 17:40:37,060 - INFO - Processing document 4_2023-03-14
2025-11-14 17:40:37,080 - INFO - Finished converting document 4_2023-03-14 in 0.05 sec.
2025-11-14 17:40:37,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,124 - INFO - Going to convert document batch...
2025-11-14 17:40:37,125 - INFO - Processing document 4_2023-04-04
2025-11-14 17:40:37,146 - INFO - Finished converting document 4_2023-04-04 in 0.03 sec.
2025-11-14 17:40:37,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,219 - INFO - Going to convert document batch...
2025-11-14 17:40:37,220 - INFO - Processing document 4_2023-04-06
2025-11-14 17:40:37,240 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 17:40:37,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,287 - INFO - Going to convert document batch...
2025-11-14 17:40:37,288 - 

Converted 'data\edgar_documents\TGT\4_2023-03-14' --> 'data\processed_data\TGT\4_2023-03-14.md'
Converted 'data\edgar_documents\TGT\4_2023-04-04' --> 'data\processed_data\TGT\4_2023-04-04.md'
Converted 'data\edgar_documents\TGT\4_2023-04-06' --> 'data\processed_data\TGT\4_2023-04-06.md'


2025-11-14 17:40:37,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,349 - INFO - Going to convert document batch...
2025-11-14 17:40:37,350 - INFO - Processing document 4_2023-06-29
2025-11-14 17:40:37,371 - INFO - Finished converting document 4_2023-06-29 in 0.05 sec.
2025-11-14 17:40:37,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,430 - INFO - Going to convert document batch...
2025-11-14 17:40:37,431 - INFO - Processing document 4_2023-08-22
2025-11-14 17:40:37,452 - INFO - Finished converting document 4_2023-08-22 in 0.06 sec.
2025-11-14 17:40:37,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,520 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TGT\4_2023-05-22' --> 'data\processed_data\TGT\4_2023-05-22.md'
Converted 'data\edgar_documents\TGT\4_2023-06-29' --> 'data\processed_data\TGT\4_2023-06-29.md'
Converted 'data\edgar_documents\TGT\4_2023-08-22' --> 'data\processed_data\TGT\4_2023-08-22.md'


2025-11-14 17:40:37,521 - INFO - Processing document 4_2023-11-02
2025-11-14 17:40:37,543 - INFO - Finished converting document 4_2023-11-02 in 0.06 sec.
2025-11-14 17:40:37,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,586 - INFO - Going to convert document batch...
2025-11-14 17:40:37,587 - INFO - Processing document 4_2023-11-17
2025-11-14 17:40:37,606 - INFO - Finished converting document 4_2023-11-17 in 0.05 sec.
2025-11-14 17:40:37,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,647 - INFO - Going to convert document batch...
2025-11-14 17:40:37,648 - INFO - Processing document 4_2023-11-27
2025-11-14 17:40:37,672 - INFO - Finished converting document 4_2023-11-27 in 0.05 sec.
2025-11-14 17:40:37,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,715 - INFO - Going to convert document batch...
2025-11-14 17:40:37,716 - INFO - Processing document 4_2023-11-29
2025-11-14 17:40:37,732 - IN

Converted 'data\edgar_documents\TGT\4_2023-11-02' --> 'data\processed_data\TGT\4_2023-11-02.md'
Converted 'data\edgar_documents\TGT\4_2023-11-17' --> 'data\processed_data\TGT\4_2023-11-17.md'
Converted 'data\edgar_documents\TGT\4_2023-11-27' --> 'data\processed_data\TGT\4_2023-11-27.md'


2025-11-14 17:40:37,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,770 - INFO - Going to convert document batch...
2025-11-14 17:40:37,771 - INFO - Processing document 4_2024-01-31
2025-11-14 17:40:37,791 - INFO - Finished converting document 4_2024-01-31 in 0.03 sec.
2025-11-14 17:40:37,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,832 - INFO - Going to convert document batch...
2025-11-14 17:40:37,832 - INFO - Processing document 4_2024-03-07
2025-11-14 17:40:37,852 - INFO - Finished converting document 4_2024-03-07 in 0.03 sec.
2025-11-14 17:40:37,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,907 - INFO - Going to convert document batch...
2025-11-14 17:40:37,908 - INFO - Processing document 4_2024-03-11
2025-11-14 17:40:37,926 - INFO - Finished converting document 4_2024-03-11 in 0.05 sec.


Converted 'data\edgar_documents\TGT\4_2023-11-29' --> 'data\processed_data\TGT\4_2023-11-29.md'
Converted 'data\edgar_documents\TGT\4_2024-01-31' --> 'data\processed_data\TGT\4_2024-01-31.md'
Converted 'data\edgar_documents\TGT\4_2024-03-07' --> 'data\processed_data\TGT\4_2024-03-07.md'


2025-11-14 17:40:37,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:37,965 - INFO - Going to convert document batch...
2025-11-14 17:40:37,967 - INFO - Processing document 4_2024-03-12
2025-11-14 17:40:37,987 - INFO - Finished converting document 4_2024-03-12 in 0.05 sec.
2025-11-14 17:40:38,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,051 - INFO - Going to convert document batch...
2025-11-14 17:40:38,052 - INFO - Processing document 4_2024-03-13
2025-11-14 17:40:38,084 - INFO - Finished converting document 4_2024-03-13 in 0.06 sec.
2025-11-14 17:40:38,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\4_2024-03-11' --> 'data\processed_data\TGT\4_2024-03-11.md'
Converted 'data\edgar_documents\TGT\4_2024-03-12' --> 'data\processed_data\TGT\4_2024-03-12.md'
Converted 'data\edgar_documents\TGT\4_2024-03-13' --> 'data\processed_data\TGT\4_2024-03-13.md'


2025-11-14 17:40:38,127 - INFO - Going to convert document batch...
2025-11-14 17:40:38,128 - INFO - Processing document 4_2024-03-15
2025-11-14 17:40:38,149 - INFO - Finished converting document 4_2024-03-15 in 0.03 sec.
2025-11-14 17:40:38,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,195 - INFO - Going to convert document batch...
2025-11-14 17:40:38,195 - INFO - Processing document 4_2024-03-22
2025-11-14 17:40:38,216 - INFO - Finished converting document 4_2024-03-22 in 0.05 sec.
2025-11-14 17:40:38,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,273 - INFO - Going to convert document batch...
2025-11-14 17:40:38,274 - INFO - Processing document 4_2024-04-11
2025-11-14 17:40:38,294 - INFO - Finished converting document 4_2024-04-11 in 0.06 sec.
2025-11-14 17:40:38,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,335 - INFO - Going to convert document batch...
2025-11-14 17:40:38,336 - 

Converted 'data\edgar_documents\TGT\4_2024-03-15' --> 'data\processed_data\TGT\4_2024-03-15.md'
Converted 'data\edgar_documents\TGT\4_2024-03-22' --> 'data\processed_data\TGT\4_2024-03-22.md'
Converted 'data\edgar_documents\TGT\4_2024-04-11' --> 'data\processed_data\TGT\4_2024-04-11.md'


2025-11-14 17:40:38,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,396 - INFO - Going to convert document batch...
2025-11-14 17:40:38,397 - INFO - Processing document 4_2024-08-23
2025-11-14 17:40:38,417 - INFO - Finished converting document 4_2024-08-23 in 0.05 sec.
2025-11-14 17:40:38,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,459 - INFO - Going to convert document batch...
2025-11-14 17:40:38,460 - INFO - Processing document 4_2024-08-28
2025-11-14 17:40:38,479 - INFO - Finished converting document 4_2024-08-28 in 0.05 sec.
2025-11-14 17:40:38,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,536 - INFO - Going to convert document batch...
2025-11-14 17:40:38,537 - INFO - Processing document 4_2024-09-03
2025-11-14 17:40:38,558 - INFO - Finished converting document 4_2024-09-03 in 0.06 sec.


Converted 'data\edgar_documents\TGT\4_2024-06-05' --> 'data\processed_data\TGT\4_2024-06-05.md'
Converted 'data\edgar_documents\TGT\4_2024-08-23' --> 'data\processed_data\TGT\4_2024-08-23.md'
Converted 'data\edgar_documents\TGT\4_2024-08-28' --> 'data\processed_data\TGT\4_2024-08-28.md'


2025-11-14 17:40:38,600 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:38,601 - ERROR - Input document 4_2024-09-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40:38,603 - INFO - Going to convert document batch...
2025-11-14 17:40:38,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:38,624 - INFO - Going to convert document batch...
2025-11-14 17:40:38,625 - INFO - Processing document 4_2024-09-30
2025-11-14 17:40:38,645 - INFO - Fin

Converted 'data\edgar_documents\TGT\4_2024-09-03' --> 'data\processed_data\TGT\4_2024-09-03.md'
Error processing data\edgar_documents\TGT\4_2024-09-04: File format not allowed: data\edgar_documents\TGT\4_2024-09-04
Converted 'data\edgar_documents\TGT\4_2024-09-30' --> 'data\processed_data\TGT\4_2024-09-30.md'


2025-11-14 17:40:39,031 - INFO - Finished converting document 4_2024-10-02 in 0.36 sec.
2025-11-14 17:40:39,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,082 - INFO - Going to convert document batch...
2025-11-14 17:40:39,083 - INFO - Processing document 4_2025-01-31
2025-11-14 17:40:39,103 - INFO - Finished converting document 4_2025-01-31 in 0.03 sec.
2025-11-14 17:40:39,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,145 - INFO - Going to convert document batch...
2025-11-14 17:40:39,146 - INFO - Processing document 4_2025-03-10
2025-11-14 17:40:39,164 - INFO - Finished converting document 4_2025-03-10 in 0.03 sec.
2025-11-14 17:40:39,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,220 - INFO - Going to convert document batch...
2025-11-14 17:40:39,220 - INFO - Processing document 4_2025-03-12
2025-11-14 17:40:39,239 - INFO - Finished converting document 4_2025-03-12 in 0.05 sec.


Converted 'data\edgar_documents\TGT\4_2024-10-02' --> 'data\processed_data\TGT\4_2024-10-02.md'
Converted 'data\edgar_documents\TGT\4_2025-01-31' --> 'data\processed_data\TGT\4_2025-01-31.md'
Converted 'data\edgar_documents\TGT\4_2025-03-10' --> 'data\processed_data\TGT\4_2025-03-10.md'


2025-11-14 17:40:39,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,281 - INFO - Going to convert document batch...
2025-11-14 17:40:39,282 - INFO - Processing document 4_2025-03-14
2025-11-14 17:40:39,303 - INFO - Finished converting document 4_2025-03-14 in 0.03 sec.
2025-11-14 17:40:39,346 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:39,346 - ERROR - Input document 4_2025-03-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40

Converted 'data\edgar_documents\TGT\4_2025-03-12' --> 'data\processed_data\TGT\4_2025-03-12.md'
Converted 'data\edgar_documents\TGT\4_2025-03-14' --> 'data\processed_data\TGT\4_2025-03-14.md'
Error processing data\edgar_documents\TGT\4_2025-03-20: File format not allowed: data\edgar_documents\TGT\4_2025-03-20
Error processing data\edgar_documents\TGT\4_2025-03-21: File format not allowed: data\edgar_documents\TGT\4_2025-03-21
Converted 'data\edgar_documents\TGT\4_2025-04-10' --> 'data\processed_data\TGT\4_2025-04-10.md'


2025-11-14 17:40:39,451 - INFO - Processing document 4_2025-05-30
2025-11-14 17:40:39,470 - INFO - Finished converting document 4_2025-05-30 in 0.05 sec.
2025-11-14 17:40:39,532 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:40:39,532 - ERROR - Input document 4_2025-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:40:39,534 - INFO - Going to convert document batch...
2025-11-14 17:40:39,556 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\TGT\4_2025-05-30' --> 'data\processed_data\TGT\4_2025-05-30.md'
Error processing data\edgar_documents\TGT\4_2025-06-05: File format not allowed: data\edgar_documents\TGT\4_2025-06-05
Error processing data\edgar_documents\TGT\4_2025-06-06: File format not allowed: data\edgar_documents\TGT\4_2025-06-06
Converted 'data\edgar_documents\TGT\4_2025-06-12' --> 'data\processed_data\TGT\4_2025-06-12.md'


2025-11-14 17:40:39,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,712 - INFO - Going to convert document batch...
2025-11-14 17:40:39,713 - INFO - Processing document 4_2025-11-04
2025-11-14 17:40:39,734 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 17:40:39,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,811 - INFO - Going to convert document batch...
2025-11-14 17:40:39,813 - INFO - Processing document 8-K_2023-01-12
2025-11-14 17:40:39,847 - INFO - Finished converting document 8-K_2023-01-12 in 0.09 sec.
2025-11-14 17:40:39,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\4_2025-10-02' --> 'data\processed_data\TGT\4_2025-10-02.md'
Converted 'data\edgar_documents\TGT\4_2025-11-04' --> 'data\processed_data\TGT\4_2025-11-04.md'
Converted 'data\edgar_documents\TGT\8-K_2023-01-12' --> 'data\processed_data\TGT\8-K_2023-01-12.md'


2025-11-14 17:40:39,889 - INFO - Going to convert document batch...
2025-11-14 17:40:39,890 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:40:39,913 - INFO - Finished converting document 8-K_2023-01-24 in 0.05 sec.
2025-11-14 17:40:39,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:39,959 - INFO - Going to convert document batch...
2025-11-14 17:40:39,959 - INFO - Processing document 8-K_2023-02-14
2025-11-14 17:40:39,976 - INFO - Finished converting document 8-K_2023-02-14 in 0.05 sec.
2025-11-14 17:40:39,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,014 - INFO - Going to convert document batch...
2025-11-14 17:40:40,015 - INFO - Processing document 8-K_2023-02-28
2025-11-14 17:40:40,034 - INFO - Finished converting document 8-K_2023-02-28 in 0.05 sec.
2025-11-14 17:40:40,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,070 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\TGT\8-K_2023-01-24' --> 'data\processed_data\TGT\8-K_2023-01-24.md'
Converted 'data\edgar_documents\TGT\8-K_2023-02-14' --> 'data\processed_data\TGT\8-K_2023-02-14.md'
Converted 'data\edgar_documents\TGT\8-K_2023-02-28' --> 'data\processed_data\TGT\8-K_2023-02-28.md'
Converted 'data\edgar_documents\TGT\8-K_2023-05-17' --> 'data\processed_data\TGT\8-K_2023-05-17.md'


2025-11-14 17:40:40,145 - INFO - Going to convert document batch...
2025-11-14 17:40:40,146 - INFO - Processing document 8-K_2023-06-15
2025-11-14 17:40:40,193 - INFO - Finished converting document 8-K_2023-06-15 in 0.09 sec.
2025-11-14 17:40:40,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,244 - INFO - Going to convert document batch...
2025-11-14 17:40:40,246 - INFO - Processing document 8-K_2023-08-16
2025-11-14 17:40:40,268 - INFO - Finished converting document 8-K_2023-08-16 in 0.05 sec.
2025-11-14 17:40:40,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,306 - INFO - Going to convert document batch...
2025-11-14 17:40:40,307 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:40:40,322 - INFO - Finished converting document 8-K_2023-10-17 in 0.03 sec.
2025-11-14 17:40:40,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,353 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\TGT\8-K_2023-06-15' --> 'data\processed_data\TGT\8-K_2023-06-15.md'
Converted 'data\edgar_documents\TGT\8-K_2023-08-16' --> 'data\processed_data\TGT\8-K_2023-08-16.md'
Converted 'data\edgar_documents\TGT\8-K_2023-10-17' --> 'data\processed_data\TGT\8-K_2023-10-17.md'
Converted 'data\edgar_documents\TGT\8-K_2023-10-18' --> 'data\processed_data\TGT\8-K_2023-10-18.md'


2025-11-14 17:40:40,404 - INFO - Processing document 8-K_2023-11-08
2025-11-14 17:40:40,423 - INFO - Finished converting document 8-K_2023-11-08 in 0.05 sec.
2025-11-14 17:40:40,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,458 - INFO - Going to convert document batch...
2025-11-14 17:40:40,458 - INFO - Processing document 8-K_2023-11-15
2025-11-14 17:40:40,479 - INFO - Finished converting document 8-K_2023-11-15 in 0.06 sec.
2025-11-14 17:40:40,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,544 - INFO - Going to convert document batch...
2025-11-14 17:40:40,546 - INFO - Processing document 8-K_2024-01-18
2025-11-14 17:40:40,564 - INFO - Finished converting document 8-K_2024-01-18 in 0.08 sec.
2025-11-14 17:40:40,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,593 - INFO - Going to convert document batch...
2025-11-14 17:40:40,594 - INFO - Processing document 8-K_2024-03-05


Converted 'data\edgar_documents\TGT\8-K_2023-11-08' --> 'data\processed_data\TGT\8-K_2023-11-08.md'
Converted 'data\edgar_documents\TGT\8-K_2023-11-15' --> 'data\processed_data\TGT\8-K_2023-11-15.md'
Converted 'data\edgar_documents\TGT\8-K_2024-01-18' --> 'data\processed_data\TGT\8-K_2024-01-18.md'


2025-11-14 17:40:40,613 - INFO - Finished converting document 8-K_2024-03-05 in 0.03 sec.
2025-11-14 17:40:40,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,645 - INFO - Going to convert document batch...
2025-11-14 17:40:40,646 - INFO - Processing document 8-K_2024-05-22
2025-11-14 17:40:40,672 - INFO - Finished converting document 8-K_2024-05-22 in 0.05 sec.
2025-11-14 17:40:40,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,746 - INFO - Going to convert document batch...
2025-11-14 17:40:40,747 - INFO - Processing document 8-K_2024-06-14
2025-11-14 17:40:40,800 - INFO - Finished converting document 8-K_2024-06-14 in 0.11 sec.


Converted 'data\edgar_documents\TGT\8-K_2024-03-05' --> 'data\processed_data\TGT\8-K_2024-03-05.md'
Converted 'data\edgar_documents\TGT\8-K_2024-05-22' --> 'data\processed_data\TGT\8-K_2024-05-22.md'
Converted 'data\edgar_documents\TGT\8-K_2024-06-14' --> 'data\processed_data\TGT\8-K_2024-06-14.md'


2025-11-14 17:40:40,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,866 - INFO - Going to convert document batch...
2025-11-14 17:40:40,867 - INFO - Processing document 8-K_2024-08-13
2025-11-14 17:40:40,885 - INFO - Finished converting document 8-K_2024-08-13 in 0.06 sec.
2025-11-14 17:40:40,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:40,922 - INFO - Going to convert document batch...
2025-11-14 17:40:40,923 - INFO - Processing document 8-K_2024-08-21
2025-11-14 17:40:40,952 - INFO - Finished converting document 8-K_2024-08-21 in 0.06 sec.
2025-11-14 17:40:40,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,012 - INFO - Going to convert document batch...
2025-11-14 17:40:41,013 - INFO - Processing document 8-K_2024-09-06
2025-11-14 17:40:41,031 - INFO - Finished converting document 8-K_2024-09-06 in 0.06 sec.
2025-11-14 17:40:41,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\TGT\8-K_2024-08-13' --> 'data\processed_data\TGT\8-K_2024-08-13.md'
Converted 'data\edgar_documents\TGT\8-K_2024-08-21' --> 'data\processed_data\TGT\8-K_2024-08-21.md'
Converted 'data\edgar_documents\TGT\8-K_2024-09-06' --> 'data\processed_data\TGT\8-K_2024-09-06.md'


2025-11-14 17:40:41,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,110 - INFO - Going to convert document batch...
2025-11-14 17:40:41,111 - INFO - Processing document 8-K_2024-10-15
2025-11-14 17:40:41,131 - INFO - Finished converting document 8-K_2024-10-15 in 0.03 sec.
2025-11-14 17:40:41,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,163 - INFO - Going to convert document batch...
2025-11-14 17:40:41,164 - INFO - Processing document 8-K_2024-11-20
2025-11-14 17:40:41,185 - INFO - Finished converting document 8-K_2024-11-20 in 0.05 sec.
2025-11-14 17:40:41,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,219 - INFO - Going to convert document batch...
2025-11-14 17:40:41,219 - INFO - Processing document 8-K_2025-01-17
2025-11-14 17:40:41,240 - INFO - Finished converting document 8-K_2025-01-17 in 0.05 sec.
2025-11-14 17:40:41,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\TGT\8-K_2024-09-19' --> 'data\processed_data\TGT\8-K_2024-09-19.md'
Converted 'data\edgar_documents\TGT\8-K_2024-10-15' --> 'data\processed_data\TGT\8-K_2024-10-15.md'
Converted 'data\edgar_documents\TGT\8-K_2024-11-20' --> 'data\processed_data\TGT\8-K_2024-11-20.md'
Converted 'data\edgar_documents\TGT\8-K_2025-01-17' --> 'data\processed_data\TGT\8-K_2025-01-17.md'


2025-11-14 17:40:41,291 - INFO - Finished converting document 8-K_2025-03-04 in 0.05 sec.
2025-11-14 17:40:41,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,320 - INFO - Going to convert document batch...
2025-11-14 17:40:41,320 - INFO - Processing document 8-K_2025-03-25
2025-11-14 17:40:41,338 - INFO - Finished converting document 8-K_2025-03-25 in 0.03 sec.
2025-11-14 17:40:41,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,396 - INFO - Going to convert document batch...
2025-11-14 17:40:41,396 - INFO - Processing document 8-K_2025-04-10
2025-11-14 17:40:41,412 - INFO - Finished converting document 8-K_2025-04-10 in 0.06 sec.
2025-11-14 17:40:41,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,447 - INFO - Going to convert document batch...
2025-11-14 17:40:41,447 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:40:41,469 - INFO - Finished converting document 8-K_2025-05-21 in 0.

Converted 'data\edgar_documents\TGT\8-K_2025-03-04' --> 'data\processed_data\TGT\8-K_2025-03-04.md'
Converted 'data\edgar_documents\TGT\8-K_2025-03-25' --> 'data\processed_data\TGT\8-K_2025-03-25.md'
Converted 'data\edgar_documents\TGT\8-K_2025-04-10' --> 'data\processed_data\TGT\8-K_2025-04-10.md'
Converted 'data\edgar_documents\TGT\8-K_2025-05-21' --> 'data\processed_data\TGT\8-K_2025-05-21.md'


2025-11-14 17:40:41,501 - INFO - Going to convert document batch...
2025-11-14 17:40:41,502 - INFO - Processing document 8-K_2025-06-10
2025-11-14 17:40:41,519 - INFO - Finished converting document 8-K_2025-06-10 in 0.03 sec.
2025-11-14 17:40:41,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,563 - INFO - Going to convert document batch...
2025-11-14 17:40:41,564 - INFO - Processing document 8-K_2025-06-13
2025-11-14 17:40:41,604 - INFO - Finished converting document 8-K_2025-06-13 in 0.08 sec.
2025-11-14 17:40:41,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:40:41,670 - INFO - Going to convert document batch...
2025-11-14 17:40:41,671 - INFO - Processing document 8-K_2025-08-20
2025-11-14 17:40:41,691 - INFO - Finished converting document 8-K_2025-08-20 in 0.06 sec.
2025-11-14 17:40:41,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\8-K_2025-06-10' --> 'data\processed_data\TGT\8-K_2025-06-10.md'
Converted 'data\edgar_documents\TGT\8-K_2025-06-13' --> 'data\processed_data\TGT\8-K_2025-06-13.md'
Converted 'data\edgar_documents\TGT\8-K_2025-08-20' --> 'data\processed_data\TGT\8-K_2025-08-20.md'


2025-11-14 17:40:41,724 - INFO - Going to convert document batch...
2025-11-14 17:40:41,724 - INFO - Processing document 8-K_2025-10-09
2025-11-14 17:40:41,740 - INFO - Finished converting document 8-K_2025-10-09 in 0.03 sec.
2025-11-14 17:40:41,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\8-K_2025-10-09' --> 'data\processed_data\TGT\8-K_2025-10-09.md'


2025-11-14 17:40:42,464 - INFO - Going to convert document batch...
2025-11-14 17:40:42,465 - INFO - Processing document DEF-14A_2023-05-01
2025-11-14 17:40:43,464 - INFO - Finished converting document DEF-14A_2023-05-01 in 1.72 sec.
2025-11-14 17:40:44,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\DEF-14A_2023-05-01' --> 'data\processed_data\TGT\DEF-14A_2023-05-01.md'


2025-11-14 17:40:44,920 - INFO - Going to convert document batch...
2025-11-14 17:40:44,921 - INFO - Processing document DEF-14A_2024-04-29
2025-11-14 17:40:46,045 - INFO - Finished converting document DEF-14A_2024-04-29 in 1.81 sec.
2025-11-14 17:40:47,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\DEF-14A_2024-04-29' --> 'data\processed_data\TGT\DEF-14A_2024-04-29.md'


2025-11-14 17:40:48,601 - INFO - Going to convert document batch...
2025-11-14 17:40:48,602 - INFO - Processing document DEF-14A_2025-04-28
2025-11-14 17:40:51,309 - INFO - Finished converting document DEF-14A_2025-04-28 in 4.00 sec.
2025-11-14 17:40:51,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TGT\DEF-14A_2025-04-28' --> 'data\processed_data\TGT\DEF-14A_2025-04-28.md'
Processed 78 new files. Errors: 7
Found 135 files to process in data\edgar_documents\TMO


2025-11-14 17:40:52,626 - INFO - Going to convert document batch...
2025-11-14 17:40:52,627 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:40:52,627 - INFO - Processing document 10-K_2023-02-23
2025-11-14 17:40:54,134 - INFO - Finished converting document 10-K_2023-02-23 in 2.28 sec.
2025-11-14 17:40:54,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-K_2023-02-23' --> 'data\processed_data\TMO\10-K_2023-02-23.md'


2025-11-14 17:40:55,850 - INFO - Going to convert document batch...
2025-11-14 17:40:55,851 - INFO - Processing document 10-K_2024-02-22
2025-11-14 17:40:57,230 - INFO - Finished converting document 10-K_2024-02-22 in 2.50 sec.
2025-11-14 17:40:57,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-K_2024-02-22' --> 'data\processed_data\TMO\10-K_2024-02-22.md'


2025-11-14 17:40:58,949 - INFO - Going to convert document batch...
2025-11-14 17:40:58,951 - INFO - Processing document 10-K_2025-02-20
2025-11-14 17:41:00,347 - INFO - Finished converting document 10-K_2025-02-20 in 2.45 sec.
2025-11-14 17:41:01,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-K_2025-02-20' --> 'data\processed_data\TMO\10-K_2025-02-20.md'


2025-11-14 17:41:01,886 - INFO - Going to convert document batch...
2025-11-14 17:41:01,887 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 17:41:02,581 - INFO - Finished converting document 10-Q_2023-05-05 in 1.56 sec.
2025-11-14 17:41:02,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2023-05-05' --> 'data\processed_data\TMO\10-Q_2023-05-05.md'


2025-11-14 17:41:03,404 - INFO - Going to convert document batch...
2025-11-14 17:41:03,405 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 17:41:04,281 - INFO - Finished converting document 10-Q_2023-08-04 in 1.34 sec.
2025-11-14 17:41:04,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2023-08-04' --> 'data\processed_data\TMO\10-Q_2023-08-04.md'


2025-11-14 17:41:05,606 - INFO - Going to convert document batch...
2025-11-14 17:41:05,607 - INFO - Processing document 10-Q_2023-11-03
2025-11-14 17:41:06,483 - INFO - Finished converting document 10-Q_2023-11-03 in 1.76 sec.
2025-11-14 17:41:06,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2023-11-03' --> 'data\processed_data\TMO\10-Q_2023-11-03.md'


2025-11-14 17:41:07,322 - INFO - Going to convert document batch...
2025-11-14 17:41:07,323 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 17:41:08,399 - INFO - Finished converting document 10-Q_2024-05-03 in 1.45 sec.
2025-11-14 17:41:08,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2024-05-03' --> 'data\processed_data\TMO\10-Q_2024-05-03.md'


2025-11-14 17:41:09,353 - INFO - Going to convert document batch...
2025-11-14 17:41:09,354 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 17:41:10,308 - INFO - Finished converting document 10-Q_2024-08-02 in 1.48 sec.
2025-11-14 17:41:10,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2024-08-02' --> 'data\processed_data\TMO\10-Q_2024-08-02.md'


2025-11-14 17:41:11,650 - INFO - Going to convert document batch...
2025-11-14 17:41:11,651 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 17:41:12,612 - INFO - Finished converting document 10-Q_2024-11-01 in 1.81 sec.
2025-11-14 17:41:13,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2024-11-01' --> 'data\processed_data\TMO\10-Q_2024-11-01.md'


2025-11-14 17:41:13,926 - INFO - Going to convert document batch...
2025-11-14 17:41:13,927 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 17:41:14,716 - INFO - Finished converting document 10-Q_2025-05-02 in 1.56 sec.
2025-11-14 17:41:15,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2025-05-02' --> 'data\processed_data\TMO\10-Q_2025-05-02.md'


2025-11-14 17:41:15,674 - INFO - Going to convert document batch...
2025-11-14 17:41:15,675 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 17:41:16,698 - INFO - Finished converting document 10-Q_2025-08-01 in 1.58 sec.
2025-11-14 17:41:17,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2025-08-01' --> 'data\processed_data\TMO\10-Q_2025-08-01.md'


2025-11-14 17:41:18,222 - INFO - Going to convert document batch...
2025-11-14 17:41:18,223 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 17:41:19,357 - INFO - Finished converting document 10-Q_2025-10-31 in 1.76 sec.
2025-11-14 17:41:20,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:20,104 - INFO - Going to convert document batch...
2025-11-14 17:41:20,107 - INFO - Processing document 4_2023-01-04
2025-11-14 17:41:20,159 - INFO - Finished converting document 4_2023-01-04 in 0.12 sec.
2025-11-14 17:41:20,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\10-Q_2025-10-31' --> 'data\processed_data\TMO\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\TMO\4_2023-01-04' --> 'data\processed_data\TMO\4_2023-01-04.md'


2025-11-14 17:41:20,941 - INFO - Going to convert document batch...
2025-11-14 17:41:20,942 - INFO - Processing document 4_2023-02-07
2025-11-14 17:41:20,983 - INFO - Finished converting document 4_2023-02-07 in 0.76 sec.
2025-11-14 17:41:21,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:21,073 - INFO - Going to convert document batch...
2025-11-14 17:41:21,074 - INFO - Processing document 4_2023-02-13
2025-11-14 17:41:21,113 - INFO - Finished converting document 4_2023-02-13 in 0.08 sec.
2025-11-14 17:41:21,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:21,199 - INFO - Going to convert document batch...
2025-11-14 17:41:21,200 - INFO - Processing document 4_2023-02-15


Converted 'data\edgar_documents\TMO\4_2023-02-07' --> 'data\processed_data\TMO\4_2023-02-07.md'
Converted 'data\edgar_documents\TMO\4_2023-02-13' --> 'data\processed_data\TMO\4_2023-02-13.md'


2025-11-14 17:41:21,335 - INFO - Finished converting document 4_2023-02-15 in 0.19 sec.
2025-11-14 17:41:21,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:21,473 - INFO - Going to convert document batch...
2025-11-14 17:41:21,474 - INFO - Processing document 4_2023-02-24
2025-11-14 17:41:21,520 - INFO - Finished converting document 4_2023-02-24 in 0.09 sec.
2025-11-14 17:41:21,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:21,618 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\4_2023-02-15' --> 'data\processed_data\TMO\4_2023-02-15.md'
Converted 'data\edgar_documents\TMO\4_2023-02-24' --> 'data\processed_data\TMO\4_2023-02-24.md'


2025-11-14 17:41:21,622 - INFO - Processing document 4_2023-03-02
2025-11-14 17:41:21,666 - INFO - Finished converting document 4_2023-03-02 in 0.09 sec.
2025-11-14 17:41:21,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:21,761 - INFO - Going to convert document batch...
2025-11-14 17:41:21,762 - INFO - Processing document 4_2023-03-07
2025-11-14 17:41:21,816 - INFO - Finished converting document 4_2023-03-07 in 0.09 sec.
2025-11-14 17:41:21,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2023-03-02' --> 'data\processed_data\TMO\4_2023-03-02.md'
Converted 'data\edgar_documents\TMO\4_2023-03-07' --> 'data\processed_data\TMO\4_2023-03-07.md'


2025-11-14 17:41:21,998 - INFO - Going to convert document batch...
2025-11-14 17:41:22,000 - INFO - Processing document 4_2023-03-15
2025-11-14 17:41:22,131 - INFO - Finished converting document 4_2023-03-15 in 0.23 sec.
2025-11-14 17:41:22,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:22,252 - INFO - Going to convert document batch...
2025-11-14 17:41:22,254 - INFO - Processing document 4_2023-04-04
2025-11-14 17:41:22,293 - INFO - Finished converting document 4_2023-04-04 in 0.08 sec.
2025-11-14 17:41:22,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:22,370 - INFO - Going to convert document batch...
2025-11-14 17:41:22,372 - INFO - Processing document 4_2023-05-08
2025-11-14 17:41:22,407 - INFO - Finished converting document 4_2023-05-08 in 0.06 sec.


Converted 'data\edgar_documents\TMO\4_2023-03-15' --> 'data\processed_data\TMO\4_2023-03-15.md'
Converted 'data\edgar_documents\TMO\4_2023-04-04' --> 'data\processed_data\TMO\4_2023-04-04.md'


2025-11-14 17:41:22,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:22,516 - INFO - Going to convert document batch...
2025-11-14 17:41:22,517 - INFO - Processing document 4_2023-05-10
2025-11-14 17:41:22,645 - INFO - Finished converting document 4_2023-05-10 in 0.19 sec.


Converted 'data\edgar_documents\TMO\4_2023-05-08' --> 'data\processed_data\TMO\4_2023-05-08.md'


2025-11-14 17:41:22,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:22,777 - INFO - Going to convert document batch...
2025-11-14 17:41:22,779 - INFO - Processing document 4_2023-05-15
2025-11-14 17:41:22,825 - INFO - Finished converting document 4_2023-05-15 in 0.09 sec.
2025-11-14 17:41:22,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:22,911 - INFO - Going to convert document batch...
2025-11-14 17:41:22,912 - INFO - Processing document 4_2023-05-19


Converted 'data\edgar_documents\TMO\4_2023-05-10' --> 'data\processed_data\TMO\4_2023-05-10.md'
Converted 'data\edgar_documents\TMO\4_2023-05-15' --> 'data\processed_data\TMO\4_2023-05-15.md'


2025-11-14 17:41:22,951 - INFO - Finished converting document 4_2023-05-19 in 0.08 sec.
2025-11-14 17:41:23,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:23,037 - INFO - Going to convert document batch...
2025-11-14 17:41:23,038 - INFO - Processing document 4_2023-05-26
2025-11-14 17:41:23,071 - INFO - Finished converting document 4_2023-05-26 in 0.06 sec.
2025-11-14 17:41:23,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:23,187 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\4_2023-05-19' --> 'data\processed_data\TMO\4_2023-05-19.md'
Converted 'data\edgar_documents\TMO\4_2023-05-26' --> 'data\processed_data\TMO\4_2023-05-26.md'


2025-11-14 17:41:23,188 - INFO - Processing document 4_2023-07-05
2025-11-14 17:41:23,225 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 17:41:23,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:23,305 - INFO - Going to convert document batch...
2025-11-14 17:41:23,306 - INFO - Processing document 4_2023-08-02
2025-11-14 17:41:23,353 - INFO - Finished converting document 4_2023-08-02 in 0.08 sec.
2025-11-14 17:41:23,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2023-07-05' --> 'data\processed_data\TMO\4_2023-07-05.md'
Converted 'data\edgar_documents\TMO\4_2023-08-02' --> 'data\processed_data\TMO\4_2023-08-02.md'


2025-11-14 17:41:23,460 - INFO - Going to convert document batch...
2025-11-14 17:41:23,461 - INFO - Processing document 4_2023-08-07
2025-11-14 17:41:23,597 - INFO - Finished converting document 4_2023-08-07 in 0.20 sec.
2025-11-14 17:41:23,713 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:23,714 - ERROR - Input document 4_2023-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:23,716 - INFO - Going to convert document batch...
2025-11-14 17:41:23,729 - IN

Converted 'data\edgar_documents\TMO\4_2023-08-07' --> 'data\processed_data\TMO\4_2023-08-07.md'
Error processing data\edgar_documents\TMO\4_2023-08-08: File format not allowed: data\edgar_documents\TMO\4_2023-08-08


2025-11-14 17:41:24,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:24,058 - INFO - Going to convert document batch...
2025-11-14 17:41:24,059 - INFO - Processing document 4_2023-08-25
2025-11-14 17:41:24,114 - INFO - Finished converting document 4_2023-08-25 in 0.09 sec.
2025-11-14 17:41:24,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2023-08-09' --> 'data\processed_data\TMO\4_2023-08-09.md'
Converted 'data\edgar_documents\TMO\4_2023-08-25' --> 'data\processed_data\TMO\4_2023-08-25.md'


2025-11-14 17:41:24,224 - INFO - Going to convert document batch...
2025-11-14 17:41:24,226 - INFO - Processing document 4_2023-08-29
2025-11-14 17:41:24,262 - INFO - Finished converting document 4_2023-08-29 in 0.09 sec.
2025-11-14 17:41:24,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:24,329 - INFO - Going to convert document batch...
2025-11-14 17:41:24,330 - INFO - Processing document 4_2023-08-31
2025-11-14 17:41:24,372 - INFO - Finished converting document 4_2023-08-31 in 0.08 sec.
2025-11-14 17:41:24,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:24,453 - INFO - Going to convert document batch...
2025-11-14 17:41:24,454 - INFO - Processing document 4_2023-10-03


Converted 'data\edgar_documents\TMO\4_2023-08-29' --> 'data\processed_data\TMO\4_2023-08-29.md'
Converted 'data\edgar_documents\TMO\4_2023-08-31' --> 'data\processed_data\TMO\4_2023-08-31.md'


2025-11-14 17:41:24,505 - INFO - Finished converting document 4_2023-10-03 in 0.08 sec.
2025-11-14 17:41:24,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:24,598 - INFO - Going to convert document batch...
2025-11-14 17:41:24,601 - INFO - Processing document 4_2023-10-06
2025-11-14 17:41:24,667 - INFO - Finished converting document 4_2023-10-06 in 0.12 sec.
2025-11-14 17:41:24,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2023-10-03' --> 'data\processed_data\TMO\4_2023-10-03.md'
Converted 'data\edgar_documents\TMO\4_2023-10-06' --> 'data\processed_data\TMO\4_2023-10-06.md'


2025-11-14 17:41:24,807 - INFO - Going to convert document batch...
2025-11-14 17:41:24,808 - INFO - Processing document 4_2023-11-06
2025-11-14 17:41:24,939 - INFO - Finished converting document 4_2023-11-06 in 0.22 sec.
2025-11-14 17:41:25,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:25,109 - INFO - Going to convert document batch...
2025-11-14 17:41:25,110 - INFO - Processing document 4_2023-11-08


Converted 'data\edgar_documents\TMO\4_2023-11-06' --> 'data\processed_data\TMO\4_2023-11-06.md'


2025-11-14 17:41:25,241 - INFO - Finished converting document 4_2023-11-08 in 0.20 sec.
2025-11-14 17:41:25,388 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:25,389 - ERROR - Input document 4_2023-11-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:25,392 - INFO - Going to convert document batch...
2025-11-14 17:41:25,437 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:25,439 - ERROR - Input document 4_2023-11-29 with forma

Converted 'data\edgar_documents\TMO\4_2023-11-08' --> 'data\processed_data\TMO\4_2023-11-08.md'
Error processing data\edgar_documents\TMO\4_2023-11-28: File format not allowed: data\edgar_documents\TMO\4_2023-11-28
Error processing data\edgar_documents\TMO\4_2023-11-29: File format not allowed: data\edgar_documents\TMO\4_2023-11-29


2025-11-14 17:41:25,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:25,633 - INFO - Going to convert document batch...
2025-11-14 17:41:25,634 - INFO - Processing document 4_2023-12-11
2025-11-14 17:41:25,673 - INFO - Finished converting document 4_2023-12-11 in 0.08 sec.
2025-11-14 17:41:25,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2023-11-30' --> 'data\processed_data\TMO\4_2023-11-30.md'
Converted 'data\edgar_documents\TMO\4_2023-12-11' --> 'data\processed_data\TMO\4_2023-12-11.md'


2025-11-14 17:41:25,793 - INFO - Going to convert document batch...
2025-11-14 17:41:25,796 - INFO - Processing document 4_2024-01-03
2025-11-14 17:41:25,851 - INFO - Finished converting document 4_2024-01-03 in 0.12 sec.
2025-11-14 17:41:25,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:25,922 - INFO - Going to convert document batch...
2025-11-14 17:41:25,923 - INFO - Processing document 4_2024-02-08
2025-11-14 17:41:25,979 - INFO - Finished converting document 4_2024-02-08 in 0.09 sec.
2025-11-14 17:41:26,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,060 - INFO - Going to convert document batch...
2025-11-14 17:41:26,060 - INFO - Processing document 4_2024-02-14


Converted 'data\edgar_documents\TMO\4_2024-01-03' --> 'data\processed_data\TMO\4_2024-01-03.md'
Converted 'data\edgar_documents\TMO\4_2024-02-08' --> 'data\processed_data\TMO\4_2024-02-08.md'


2025-11-14 17:41:26,103 - INFO - Finished converting document 4_2024-02-14 in 0.06 sec.
2025-11-14 17:41:26,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,206 - INFO - Going to convert document batch...
2025-11-14 17:41:26,208 - INFO - Processing document 4_2024-02-20
2025-11-14 17:41:26,252 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 17:41:26,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,340 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\4_2024-02-14' --> 'data\processed_data\TMO\4_2024-02-14.md'
Converted 'data\edgar_documents\TMO\4_2024-02-20' --> 'data\processed_data\TMO\4_2024-02-20.md'


2025-11-14 17:41:26,341 - INFO - Processing document 4_2024-02-23
2025-11-14 17:41:26,390 - INFO - Finished converting document 4_2024-02-23 in 0.09 sec.
2025-11-14 17:41:26,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,495 - INFO - Going to convert document batch...
2025-11-14 17:41:26,497 - INFO - Processing document 4_2024-02-26
2025-11-14 17:41:26,551 - INFO - Finished converting document 4_2024-02-26 in 0.12 sec.


Converted 'data\edgar_documents\TMO\4_2024-02-23' --> 'data\processed_data\TMO\4_2024-02-23.md'
Converted 'data\edgar_documents\TMO\4_2024-02-26' --> 'data\processed_data\TMO\4_2024-02-26.md'


2025-11-14 17:41:26,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,668 - INFO - Going to convert document batch...
2025-11-14 17:41:26,669 - INFO - Processing document 4_2024-02-29
2025-11-14 17:41:26,842 - INFO - Finished converting document 4_2024-02-29 in 0.25 sec.
2025-11-14 17:41:26,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:26,961 - INFO - Going to convert document batch...
2025-11-14 17:41:26,964 - INFO - Processing document 4_2024-03-04
2025-11-14 17:41:27,082 - INFO - Finished converting document 4_2024-03-04 in 0.16 sec.


Converted 'data\edgar_documents\TMO\4_2024-02-29' --> 'data\processed_data\TMO\4_2024-02-29.md'


2025-11-14 17:41:27,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:27,275 - INFO - Going to convert document batch...
2025-11-14 17:41:27,276 - INFO - Processing document 4_2024-03-13


Converted 'data\edgar_documents\TMO\4_2024-03-04' --> 'data\processed_data\TMO\4_2024-03-04.md'


2025-11-14 17:41:27,390 - INFO - Finished converting document 4_2024-03-13 in 0.22 sec.
2025-11-14 17:41:27,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:27,534 - INFO - Going to convert document batch...
2025-11-14 17:41:27,536 - INFO - Processing document 4_2024-03-14


Converted 'data\edgar_documents\TMO\4_2024-03-13' --> 'data\processed_data\TMO\4_2024-03-13.md'


2025-11-14 17:41:27,715 - INFO - Finished converting document 4_2024-03-14 in 0.25 sec.
2025-11-14 17:41:27,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:27,843 - INFO - Going to convert document batch...
2025-11-14 17:41:27,844 - INFO - Processing document 4_2024-03-27
2025-11-14 17:41:27,881 - INFO - Finished converting document 4_2024-03-27 in 0.08 sec.
2025-11-14 17:41:27,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:27,967 - INFO - Going to convert document batch...
2025-11-14 17:41:27,969 - INFO - Processing document 4_2024-04-02


Converted 'data\edgar_documents\TMO\4_2024-03-14' --> 'data\processed_data\TMO\4_2024-03-14.md'
Converted 'data\edgar_documents\TMO\4_2024-03-27' --> 'data\processed_data\TMO\4_2024-03-27.md'


2025-11-14 17:41:28,009 - INFO - Finished converting document 4_2024-04-02 in 0.08 sec.
2025-11-14 17:41:28,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2024-04-02' --> 'data\processed_data\TMO\4_2024-04-02.md'


2025-11-14 17:41:28,668 - INFO - Going to convert document batch...
2025-11-14 17:41:28,670 - INFO - Processing document 4_2024-04-29
2025-11-14 17:41:28,733 - INFO - Finished converting document 4_2024-04-29 in 0.66 sec.
2025-11-14 17:41:28,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:28,886 - INFO - Going to convert document batch...
2025-11-14 17:41:28,887 - INFO - Processing document 4_2024-05-01


Converted 'data\edgar_documents\TMO\4_2024-04-29' --> 'data\processed_data\TMO\4_2024-04-29.md'


2025-11-14 17:41:29,020 - INFO - Finished converting document 4_2024-05-01 in 0.22 sec.
2025-11-14 17:41:29,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2024-05-01' --> 'data\processed_data\TMO\4_2024-05-01.md'


2025-11-14 17:41:29,384 - INFO - Going to convert document batch...
2025-11-14 17:41:29,386 - INFO - Processing document 4_2024-05-02
2025-11-14 17:41:29,471 - INFO - Finished converting document 4_2024-05-02 in 0.31 sec.
2025-11-14 17:41:29,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:29,572 - INFO - Going to convert document batch...
2025-11-14 17:41:29,573 - INFO - Processing document 4_2024-05-06
2025-11-14 17:41:29,662 - INFO - Finished converting document 4_2024-05-06 in 0.12 sec.
2025-11-14 17:41:29,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2024-05-02' --> 'data\processed_data\TMO\4_2024-05-02.md'
Converted 'data\edgar_documents\TMO\4_2024-05-06' --> 'data\processed_data\TMO\4_2024-05-06.md'


2025-11-14 17:41:29,751 - INFO - Going to convert document batch...
2025-11-14 17:41:29,752 - INFO - Processing document 4_2024-05-14
2025-11-14 17:41:29,792 - INFO - Finished converting document 4_2024-05-14 in 0.09 sec.
2025-11-14 17:41:29,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:29,865 - INFO - Going to convert document batch...
2025-11-14 17:41:29,866 - INFO - Processing document 4_2024-05-15
2025-11-14 17:41:29,913 - INFO - Finished converting document 4_2024-05-15 in 0.08 sec.
2025-11-14 17:41:29,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:29,992 - INFO - Going to convert document batch...
2025-11-14 17:41:29,993 - INFO - Processing document 4_2024-05-23


Converted 'data\edgar_documents\TMO\4_2024-05-14' --> 'data\processed_data\TMO\4_2024-05-14.md'
Converted 'data\edgar_documents\TMO\4_2024-05-15' --> 'data\processed_data\TMO\4_2024-05-15.md'


2025-11-14 17:41:30,030 - INFO - Finished converting document 4_2024-05-23 in 0.08 sec.
2025-11-14 17:41:30,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:30,104 - INFO - Going to convert document batch...
2025-11-14 17:41:30,105 - INFO - Processing document 4_2024-05-29
2025-11-14 17:41:30,151 - INFO - Finished converting document 4_2024-05-29 in 0.09 sec.
2025-11-14 17:41:30,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2024-05-23' --> 'data\processed_data\TMO\4_2024-05-23.md'
Converted 'data\edgar_documents\TMO\4_2024-05-29' --> 'data\processed_data\TMO\4_2024-05-29.md'


2025-11-14 17:41:30,293 - INFO - Going to convert document batch...
2025-11-14 17:41:30,295 - INFO - Processing document 4_2024-06-05
2025-11-14 17:41:30,379 - INFO - Finished converting document 4_2024-06-05 in 0.17 sec.
2025-11-14 17:41:30,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:30,475 - INFO - Going to convert document batch...
2025-11-14 17:41:30,477 - INFO - Processing document 4_2024-07-02
2025-11-14 17:41:30,512 - INFO - Finished converting document 4_2024-07-02 in 0.08 sec.
2025-11-14 17:41:30,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:30,602 - INFO - Going to convert document batch...
2025-11-14 17:41:30,603 - INFO - Processing document 4_2024-07-29


Converted 'data\edgar_documents\TMO\4_2024-06-05' --> 'data\processed_data\TMO\4_2024-06-05.md'
Converted 'data\edgar_documents\TMO\4_2024-07-02' --> 'data\processed_data\TMO\4_2024-07-02.md'


2025-11-14 17:41:30,654 - INFO - Finished converting document 4_2024-07-29 in 0.11 sec.
2025-11-14 17:41:30,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:30,749 - INFO - Going to convert document batch...
2025-11-14 17:41:30,750 - INFO - Processing document 4_2024-07-31


Converted 'data\edgar_documents\TMO\4_2024-07-29' --> 'data\processed_data\TMO\4_2024-07-29.md'


2025-11-14 17:41:30,883 - INFO - Finished converting document 4_2024-07-31 in 0.19 sec.
2025-11-14 17:41:30,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:31,007 - INFO - Going to convert document batch...
2025-11-14 17:41:31,008 - INFO - Processing document 4_2024-08-01
2025-11-14 17:41:31,072 - INFO - Finished converting document 4_2024-08-01 in 0.12 sec.


Converted 'data\edgar_documents\TMO\4_2024-07-31' --> 'data\processed_data\TMO\4_2024-07-31.md'
Converted 'data\edgar_documents\TMO\4_2024-08-01' --> 'data\processed_data\TMO\4_2024-08-01.md'


2025-11-14 17:41:31,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:31,193 - INFO - Going to convert document batch...
2025-11-14 17:41:31,195 - INFO - Processing document 4_2024-08-27
2025-11-14 17:41:31,257 - INFO - Finished converting document 4_2024-08-27 in 0.11 sec.
2025-11-14 17:41:31,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:31,350 - INFO - Going to convert document batch...
2025-11-14 17:41:31,352 - INFO - Processing document 4_2024-08-29
2025-11-14 17:41:31,393 - INFO - Finished converting document 4_2024-08-29 in 0.09 sec.
2025-11-14 17:41:31,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2024-08-27' --> 'data\processed_data\TMO\4_2024-08-27.md'
Converted 'data\edgar_documents\TMO\4_2024-08-29' --> 'data\processed_data\TMO\4_2024-08-29.md'


2025-11-14 17:41:31,563 - INFO - Going to convert document batch...
2025-11-14 17:41:31,565 - INFO - Processing document 4_2024-09-05
2025-11-14 17:41:31,797 - INFO - Finished converting document 4_2024-09-05 in 0.36 sec.
2025-11-14 17:41:31,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:31,910 - INFO - Going to convert document batch...
2025-11-14 17:41:31,910 - INFO - Processing document 4_2024-10-01
2025-11-14 17:41:31,946 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 17:41:32,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:32,038 - INFO - Going to convert document batch...
2025-11-14 17:41:32,039 - INFO - Processing document 4_2024-10-29


Converted 'data\edgar_documents\TMO\4_2024-09-05' --> 'data\processed_data\TMO\4_2024-09-05.md'
Converted 'data\edgar_documents\TMO\4_2024-10-01' --> 'data\processed_data\TMO\4_2024-10-01.md'


2025-11-14 17:41:32,085 - INFO - Finished converting document 4_2024-10-29 in 0.09 sec.
2025-11-14 17:41:32,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:32,222 - INFO - Going to convert document batch...
2025-11-14 17:41:32,223 - INFO - Processing document 4_2024-10-30
2025-11-14 17:41:32,331 - INFO - Finished converting document 4_2024-10-30 in 0.17 sec.


Converted 'data\edgar_documents\TMO\4_2024-10-29' --> 'data\processed_data\TMO\4_2024-10-29.md'


2025-11-14 17:41:32,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:32,446 - INFO - Going to convert document batch...
2025-11-14 17:41:32,447 - INFO - Processing document 4_2024-11-01
2025-11-14 17:41:32,528 - INFO - Finished converting document 4_2024-11-01 in 0.14 sec.


Converted 'data\edgar_documents\TMO\4_2024-10-30' --> 'data\processed_data\TMO\4_2024-10-30.md'


2025-11-14 17:41:32,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:32,687 - INFO - Going to convert document batch...
2025-11-14 17:41:32,688 - INFO - Processing document 4_2024-11-04
2025-11-14 17:41:32,772 - INFO - Finished converting document 4_2024-11-04 in 0.12 sec.


Converted 'data\edgar_documents\TMO\4_2024-11-01' --> 'data\processed_data\TMO\4_2024-11-01.md'
Converted 'data\edgar_documents\TMO\4_2024-11-04' --> 'data\processed_data\TMO\4_2024-11-04.md'


2025-11-14 17:41:32,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:32,905 - INFO - Going to convert document batch...
2025-11-14 17:41:32,907 - INFO - Processing document 4_2024-11-08
2025-11-14 17:41:33,018 - INFO - Finished converting document 4_2024-11-08 in 0.17 sec.
2025-11-14 17:41:33,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:33,127 - INFO - Going to convert document batch...
2025-11-14 17:41:33,128 - INFO - Processing document 4_2024-11-12
2025-11-14 17:41:33,183 - INFO - Finished converting document 4_2024-11-12 in 0.09 sec.
2025-11-14 17:41:33,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:33,295 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\4_2024-11-08' --> 'data\processed_data\TMO\4_2024-11-08.md'
Converted 'data\edgar_documents\TMO\4_2024-11-12' --> 'data\processed_data\TMO\4_2024-11-12.md'


2025-11-14 17:41:33,297 - INFO - Processing document 4_2024-12-04
2025-11-14 17:41:33,389 - INFO - Finished converting document 4_2024-12-04 in 0.16 sec.
2025-11-14 17:41:33,471 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:33,486 - INFO - Going to convert document batch...
2025-11-14 17:41:33,487 - INFO - Processing document 4_2024-12-09
2025-11-14 17:41:33,534 - INFO - Finished converting document 4_2024-12-09 in 0.08 sec.
2025-11-14 17:41:33,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:33,623 - INFO - Going to convert document batch...
2025-11-14 17:41:33,624 - INFO - Processing document 4_2025-01-02


Converted 'data\edgar_documents\TMO\4_2024-12-04' --> 'data\processed_data\TMO\4_2024-12-04.md'
Converted 'data\edgar_documents\TMO\4_2024-12-09' --> 'data\processed_data\TMO\4_2024-12-09.md'


2025-11-14 17:41:33,671 - INFO - Finished converting document 4_2025-01-02 in 0.09 sec.
2025-11-14 17:41:33,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:33,761 - INFO - Going to convert document batch...
2025-11-14 17:41:33,762 - INFO - Processing document 4_2025-02-05
2025-11-14 17:41:33,814 - INFO - Finished converting document 4_2025-02-05 in 0.11 sec.
2025-11-14 17:41:33,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\4_2025-01-02' --> 'data\processed_data\TMO\4_2025-01-02.md'
Converted 'data\edgar_documents\TMO\4_2025-02-05' --> 'data\processed_data\TMO\4_2025-02-05.md'


2025-11-14 17:41:33,902 - INFO - Going to convert document batch...
2025-11-14 17:41:33,903 - INFO - Processing document 4_2025-02-18
2025-11-14 17:41:33,943 - INFO - Finished converting document 4_2025-02-18 in 0.08 sec.
2025-11-14 17:41:33,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,011 - INFO - Going to convert document batch...
2025-11-14 17:41:34,013 - INFO - Processing document 4_2025-02-21
2025-11-14 17:41:34,057 - INFO - Finished converting document 4_2025-02-21 in 0.08 sec.
2025-11-14 17:41:34,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,158 - INFO - Going to convert document batch...
2025-11-14 17:41:34,161 - INFO - Processing document 4_2025-02-26


Converted 'data\edgar_documents\TMO\4_2025-02-18' --> 'data\processed_data\TMO\4_2025-02-18.md'
Converted 'data\edgar_documents\TMO\4_2025-02-21' --> 'data\processed_data\TMO\4_2025-02-21.md'


2025-11-14 17:41:34,218 - INFO - Finished converting document 4_2025-02-26 in 0.12 sec.
2025-11-14 17:41:34,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,346 - INFO - Going to convert document batch...
2025-11-14 17:41:34,351 - INFO - Processing document 4_2025-03-04
2025-11-14 17:41:34,424 - INFO - Finished converting document 4_2025-03-04 in 0.16 sec.


Converted 'data\edgar_documents\TMO\4_2025-02-26' --> 'data\processed_data\TMO\4_2025-02-26.md'


2025-11-14 17:41:34,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,524 - INFO - Going to convert document batch...
2025-11-14 17:41:34,525 - INFO - Processing document 4_2025-03-06
2025-11-14 17:41:34,637 - INFO - Finished converting document 4_2025-03-06 in 0.17 sec.


Converted 'data\edgar_documents\TMO\4_2025-03-04' --> 'data\processed_data\TMO\4_2025-03-04.md'


2025-11-14 17:41:34,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,753 - INFO - Going to convert document batch...
2025-11-14 17:41:34,755 - INFO - Processing document 4_2025-03-11
2025-11-14 17:41:34,812 - INFO - Finished converting document 4_2025-03-11 in 0.09 sec.
2025-11-14 17:41:34,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,877 - INFO - Going to convert document batch...
2025-11-14 17:41:34,878 - INFO - Processing document 4_2025-04-01


Converted 'data\edgar_documents\TMO\4_2025-03-06' --> 'data\processed_data\TMO\4_2025-03-06.md'
Converted 'data\edgar_documents\TMO\4_2025-03-11' --> 'data\processed_data\TMO\4_2025-03-11.md'


2025-11-14 17:41:34,914 - INFO - Finished converting document 4_2025-04-01 in 0.06 sec.
2025-11-14 17:41:34,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:34,979 - INFO - Going to convert document batch...
2025-11-14 17:41:34,980 - INFO - Processing document 4_2025-04-30
2025-11-14 17:41:35,017 - INFO - Finished converting document 4_2025-04-30 in 0.06 sec.
2025-11-14 17:41:35,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:35,082 - INFO - Going to convert document batch...
2025-11-14 17:41:35,084 - INFO - Processing document 4_2025-05-13
2025-11-14 17:41:35,121 - INFO - Finished converting document 4_2025-05-13 in 0.08 sec.


Converted 'data\edgar_documents\TMO\4_2025-04-01' --> 'data\processed_data\TMO\4_2025-04-01.md'
Converted 'data\edgar_documents\TMO\4_2025-04-30' --> 'data\processed_data\TMO\4_2025-04-30.md'


2025-11-14 17:41:35,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:35,249 - INFO - Going to convert document batch...
2025-11-14 17:41:35,251 - INFO - Processing document 4_2025-05-22
2025-11-14 17:41:35,315 - INFO - Finished converting document 4_2025-05-22 in 0.14 sec.


Converted 'data\edgar_documents\TMO\4_2025-05-13' --> 'data\processed_data\TMO\4_2025-05-13.md'


2025-11-14 17:41:35,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:35,414 - INFO - Going to convert document batch...
2025-11-14 17:41:35,415 - INFO - Processing document 4_2025-06-03


Converted 'data\edgar_documents\TMO\4_2025-05-22' --> 'data\processed_data\TMO\4_2025-05-22.md'


2025-11-14 17:41:35,847 - INFO - Finished converting document 4_2025-06-03 in 0.47 sec.
2025-11-14 17:41:35,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:35,961 - INFO - Going to convert document batch...
2025-11-14 17:41:35,963 - INFO - Processing document 4_2025-07-01
2025-11-14 17:41:35,997 - INFO - Finished converting document 4_2025-07-01 in 0.09 sec.
2025-11-14 17:41:36,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,075 - INFO - Going to convert document batch...
2025-11-14 17:41:36,076 - INFO - Processing document 4_2025-07-28


Converted 'data\edgar_documents\TMO\4_2025-06-03' --> 'data\processed_data\TMO\4_2025-06-03.md'
Converted 'data\edgar_documents\TMO\4_2025-07-01' --> 'data\processed_data\TMO\4_2025-07-01.md'


2025-11-14 17:41:36,113 - INFO - Finished converting document 4_2025-07-28 in 0.08 sec.
2025-11-14 17:41:36,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,240 - INFO - Going to convert document batch...
2025-11-14 17:41:36,241 - INFO - Processing document 4_2025-08-07


Converted 'data\edgar_documents\TMO\4_2025-07-28' --> 'data\processed_data\TMO\4_2025-07-28.md'


2025-11-14 17:41:36,350 - INFO - Finished converting document 4_2025-08-07 in 0.20 sec.
2025-11-14 17:41:36,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,476 - INFO - Going to convert document batch...
2025-11-14 17:41:36,477 - INFO - Processing document 4_2025-08-21
2025-11-14 17:41:36,532 - INFO - Finished converting document 4_2025-08-21 in 0.11 sec.
2025-11-14 17:41:36,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,614 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\4_2025-08-07' --> 'data\processed_data\TMO\4_2025-08-07.md'
Converted 'data\edgar_documents\TMO\4_2025-08-21' --> 'data\processed_data\TMO\4_2025-08-21.md'


2025-11-14 17:41:36,615 - INFO - Processing document 4_2025-08-26
2025-11-14 17:41:36,664 - INFO - Finished converting document 4_2025-08-26 in 0.08 sec.
2025-11-14 17:41:36,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,743 - INFO - Going to convert document batch...
2025-11-14 17:41:36,744 - INFO - Processing document 4_2025-09-02
2025-11-14 17:41:36,781 - INFO - Finished converting document 4_2025-09-02 in 0.08 sec.
2025-11-14 17:41:36,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,853 - INFO - Going to convert document batch...
2025-11-14 17:41:36,854 - INFO - Processing document 4_2025-09-09
2025-11-14 17:41:36,903 - INFO - Finished converting document 4_2025-09-09 in 0.09 sec.


Converted 'data\edgar_documents\TMO\4_2025-08-26' --> 'data\processed_data\TMO\4_2025-08-26.md'
Converted 'data\edgar_documents\TMO\4_2025-09-02' --> 'data\processed_data\TMO\4_2025-09-02.md'


2025-11-14 17:41:36,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:36,989 - INFO - Going to convert document batch...
2025-11-14 17:41:36,992 - INFO - Processing document 4_2025-09-30
2025-11-14 17:41:37,030 - INFO - Finished converting document 4_2025-09-30 in 0.09 sec.


Converted 'data\edgar_documents\TMO\4_2025-09-09' --> 'data\processed_data\TMO\4_2025-09-09.md'
Converted 'data\edgar_documents\TMO\4_2025-09-30' --> 'data\processed_data\TMO\4_2025-09-30.md'


2025-11-14 17:41:37,151 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:37,152 - ERROR - Input document 4_2025-10-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:37,157 - INFO - Going to convert document batch...
2025-11-14 17:41:37,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:37,185 - INFO - Going to convert document batch...
2025-11-14 17:41:37,186 - INFO - Processing document 4_2025-10-28
2025-11-14 17:41:37,216 - INFO - Fin

Error processing data\edgar_documents\TMO\4_2025-10-01: File format not allowed: data\edgar_documents\TMO\4_2025-10-01
Converted 'data\edgar_documents\TMO\4_2025-10-28' --> 'data\processed_data\TMO\4_2025-10-28.md'


2025-11-14 17:41:37,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:37,415 - INFO - Going to convert document batch...
2025-11-14 17:41:37,417 - INFO - Processing document 8-K_2023-02-01
2025-11-14 17:41:37,454 - INFO - Finished converting document 8-K_2023-02-01 in 0.09 sec.
2025-11-14 17:41:37,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:37,527 - INFO - Going to convert document batch...
2025-11-14 17:41:37,528 - INFO - Processing document 8-K_2023-04-26
2025-11-14 17:41:37,557 - INFO - Finished converting document 8-K_2023-04-26 in 0.09 sec.


Converted 'data\edgar_documents\TMO\4_2025-11-10' --> 'data\processed_data\TMO\4_2025-11-10.md'
Converted 'data\edgar_documents\TMO\8-K_2023-02-01' --> 'data\processed_data\TMO\8-K_2023-02-01.md'


2025-11-14 17:41:37,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:37,692 - INFO - Going to convert document batch...
2025-11-14 17:41:37,693 - INFO - Processing document 8-K_2023-05-26


Converted 'data\edgar_documents\TMO\8-K_2023-04-26' --> 'data\processed_data\TMO\8-K_2023-04-26.md'


2025-11-14 17:41:37,803 - INFO - Finished converting document 8-K_2023-05-26 in 0.20 sec.
2025-11-14 17:41:37,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:37,889 - INFO - Going to convert document batch...
2025-11-14 17:41:37,890 - INFO - Processing document 8-K_2023-07-13
2025-11-14 17:41:37,931 - INFO - Finished converting document 8-K_2023-07-13 in 0.09 sec.
2025-11-14 17:41:37,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,003 - INFO - Going to convert document batch...
2025-11-14 17:41:38,004 - INFO - Processing document 8-K_2023-07-26
2025-11-14 17:41:38,043 - INFO - Finished converting document 8-K_2023-07-26 in 0.09 sec.


Converted 'data\edgar_documents\TMO\8-K_2023-05-26' --> 'data\processed_data\TMO\8-K_2023-05-26.md'
Converted 'data\edgar_documents\TMO\8-K_2023-07-13' --> 'data\processed_data\TMO\8-K_2023-07-13.md'


2025-11-14 17:41:38,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,142 - INFO - Going to convert document batch...
2025-11-14 17:41:38,143 - INFO - Processing document 8-K_2023-08-08
2025-11-14 17:41:38,180 - INFO - Finished converting document 8-K_2023-08-08 in 0.09 sec.
2025-11-14 17:41:38,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\8-K_2023-07-26' --> 'data\processed_data\TMO\8-K_2023-07-26.md'
Converted 'data\edgar_documents\TMO\8-K_2023-08-08' --> 'data\processed_data\TMO\8-K_2023-08-08.md'


2025-11-14 17:41:38,270 - INFO - Going to convert document batch...
2025-11-14 17:41:38,271 - INFO - Processing document 8-K_2023-08-10
2025-11-14 17:41:38,334 - INFO - Finished converting document 8-K_2023-08-10 in 0.14 sec.
2025-11-14 17:41:38,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,431 - INFO - Going to convert document batch...
2025-11-14 17:41:38,432 - INFO - Processing document 8-K_2023-09-21
2025-11-14 17:41:38,477 - INFO - Finished converting document 8-K_2023-09-21 in 0.11 sec.
2025-11-14 17:41:38,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,546 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMO\8-K_2023-08-10' --> 'data\processed_data\TMO\8-K_2023-08-10.md'
Converted 'data\edgar_documents\TMO\8-K_2023-09-21' --> 'data\processed_data\TMO\8-K_2023-09-21.md'


2025-11-14 17:41:38,548 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:41:38,601 - INFO - Finished converting document 8-K_2023-10-17 in 0.09 sec.
2025-11-14 17:41:38,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,666 - INFO - Going to convert document batch...
2025-11-14 17:41:38,667 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:41:38,707 - INFO - Finished converting document 8-K_2023-10-25 in 0.08 sec.
2025-11-14 17:41:38,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,777 - INFO - Going to convert document batch...
2025-11-14 17:41:38,778 - INFO - Processing document 8-K_2023-11-07


Converted 'data\edgar_documents\TMO\8-K_2023-10-17' --> 'data\processed_data\TMO\8-K_2023-10-17.md'
Converted 'data\edgar_documents\TMO\8-K_2023-10-25' --> 'data\processed_data\TMO\8-K_2023-10-25.md'


2025-11-14 17:41:38,827 - INFO - Finished converting document 8-K_2023-11-07 in 0.11 sec.
2025-11-14 17:41:38,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:38,941 - INFO - Going to convert document batch...
2025-11-14 17:41:38,943 - INFO - Processing document 8-K_2023-12-05
2025-11-14 17:41:38,993 - INFO - Finished converting document 8-K_2023-12-05 in 0.12 sec.


Converted 'data\edgar_documents\TMO\8-K_2023-11-07' --> 'data\processed_data\TMO\8-K_2023-11-07.md'
Converted 'data\edgar_documents\TMO\8-K_2023-12-05' --> 'data\processed_data\TMO\8-K_2023-12-05.md'


2025-11-14 17:41:39,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:39,124 - INFO - Going to convert document batch...
2025-11-14 17:41:39,126 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:41:39,167 - INFO - Finished converting document 8-K_2024-01-31 in 0.12 sec.
2025-11-14 17:41:39,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:39,269 - INFO - Going to convert document batch...
2025-11-14 17:41:39,271 - INFO - Processing document 8-K_2024-04-24
2025-11-14 17:41:39,367 - INFO - Finished converting document 8-K_2024-04-24 in 0.17 sec.


Converted 'data\edgar_documents\TMO\8-K_2024-01-31' --> 'data\processed_data\TMO\8-K_2024-01-31.md'


2025-11-14 17:41:39,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:39,460 - INFO - Going to convert document batch...
2025-11-14 17:41:39,461 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:41:39,559 - INFO - Finished converting document 8-K_2024-05-24 in 0.17 sec.


Converted 'data\edgar_documents\TMO\8-K_2024-04-24' --> 'data\processed_data\TMO\8-K_2024-04-24.md'


2025-11-14 17:41:39,620 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:39,621 - ERROR - Input document 8-K_2024-07-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:39,622 - INFO - Going to convert document batch...
2025-11-14 17:41:39,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:39,694 - INFO - Going to convert document batch...
2025-11-14 17:41:39,696 - INFO - Processing document 8-K_2024-07

Converted 'data\edgar_documents\TMO\8-K_2024-05-24' --> 'data\processed_data\TMO\8-K_2024-05-24.md'
Error processing data\edgar_documents\TMO\8-K_2024-07-10: File format not allowed: data\edgar_documents\TMO\8-K_2024-07-10
Converted 'data\edgar_documents\TMO\8-K_2024-07-24' --> 'data\processed_data\TMO\8-K_2024-07-24.md'


2025-11-14 17:41:39,802 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:41:39,839 - INFO - Finished converting document 8-K_2024-10-23 in 0.09 sec.
2025-11-14 17:41:39,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:39,907 - INFO - Going to convert document batch...
2025-11-14 17:41:39,908 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:41:39,947 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.
2025-11-14 17:41:39,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,027 - INFO - Going to convert document batch...
2025-11-14 17:41:40,029 - INFO - Processing document 8-K_2025-02-19
2025-11-14 17:41:40,073 - INFO - Finished converting document 8-K_2025-02-19 in 0.11 sec.


Converted 'data\edgar_documents\TMO\8-K_2024-10-23' --> 'data\processed_data\TMO\8-K_2024-10-23.md'
Converted 'data\edgar_documents\TMO\8-K_2025-01-30' --> 'data\processed_data\TMO\8-K_2025-01-30.md'


2025-11-14 17:41:40,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,156 - INFO - Going to convert document batch...
2025-11-14 17:41:40,157 - INFO - Processing document 8-K_2025-02-25
2025-11-14 17:41:40,194 - INFO - Finished converting document 8-K_2025-02-25 in 0.09 sec.
2025-11-14 17:41:40,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,263 - INFO - Going to convert document batch...
2025-11-14 17:41:40,264 - INFO - Processing document 8-K_2025-04-23


Converted 'data\edgar_documents\TMO\8-K_2025-02-19' --> 'data\processed_data\TMO\8-K_2025-02-19.md'
Converted 'data\edgar_documents\TMO\8-K_2025-02-25' --> 'data\processed_data\TMO\8-K_2025-02-25.md'


2025-11-14 17:41:40,300 - INFO - Finished converting document 8-K_2025-04-23 in 0.09 sec.
2025-11-14 17:41:40,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,382 - INFO - Going to convert document batch...
2025-11-14 17:41:40,383 - INFO - Processing document 8-K_2025-05-22
2025-11-14 17:41:40,455 - INFO - Finished converting document 8-K_2025-05-22 in 0.12 sec.
2025-11-14 17:41:40,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\8-K_2025-04-23' --> 'data\processed_data\TMO\8-K_2025-04-23.md'
Converted 'data\edgar_documents\TMO\8-K_2025-05-22' --> 'data\processed_data\TMO\8-K_2025-05-22.md'


2025-11-14 17:41:40,590 - INFO - Going to convert document batch...
2025-11-14 17:41:40,591 - INFO - Processing document 8-K_2025-05-28
2025-11-14 17:41:40,664 - INFO - Finished converting document 8-K_2025-05-28 in 0.17 sec.
2025-11-14 17:41:40,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,742 - INFO - Going to convert document batch...
2025-11-14 17:41:40,743 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:41:40,776 - INFO - Finished converting document 8-K_2025-07-23 in 0.09 sec.
2025-11-14 17:41:40,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,839 - INFO - Going to convert document batch...
2025-11-14 17:41:40,840 - INFO - Processing document 8-K_2025-09-02
2025-11-14 17:41:40,879 - INFO - Finished converting document 8-K_2025-09-02 in 0.08 sec.


Converted 'data\edgar_documents\TMO\8-K_2025-05-28' --> 'data\processed_data\TMO\8-K_2025-05-28.md'
Converted 'data\edgar_documents\TMO\8-K_2025-07-23' --> 'data\processed_data\TMO\8-K_2025-07-23.md'


2025-11-14 17:41:40,916 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:40,917 - ERROR - Input document 8-K_2025-10-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:40,918 - INFO - Going to convert document batch...
2025-11-14 17:41:40,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:40,979 - INFO - Going to convert document batch...
2025-11-14 17:41:40,980 - INFO - Processing document 8-K_2025-10

Converted 'data\edgar_documents\TMO\8-K_2025-09-02' --> 'data\processed_data\TMO\8-K_2025-09-02.md'
Error processing data\edgar_documents\TMO\8-K_2025-10-07: File format not allowed: data\edgar_documents\TMO\8-K_2025-10-07
Converted 'data\edgar_documents\TMO\8-K_2025-10-22' --> 'data\processed_data\TMO\8-K_2025-10-22.md'


2025-11-14 17:41:41,110 - INFO - Going to convert document batch...
2025-11-14 17:41:41,112 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:41:41,164 - INFO - Finished converting document 8-K_2025-10-29 in 0.12 sec.
2025-11-14 17:41:41,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMO\8-K_2025-10-29' --> 'data\processed_data\TMO\8-K_2025-10-29.md'


2025-11-14 17:41:43,174 - INFO - Going to convert document batch...
2025-11-14 17:41:43,175 - INFO - Processing document DEF-14A_2023-04-07
2025-11-14 17:41:49,118 - INFO - Finished converting document DEF-14A_2023-04-07 in 7.92 sec.
2025-11-14 17:41:51,096 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:41:51,097 - ERROR - Input document DEF-14A_2024-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:41:51,100 - INFO - Going to 

Converted 'data\edgar_documents\TMO\DEF-14A_2023-04-07' --> 'data\processed_data\TMO\DEF-14A_2023-04-07.md'
Error processing data\edgar_documents\TMO\DEF-14A_2024-04-09: File format not allowed: data\edgar_documents\TMO\DEF-14A_2024-04-09
Error processing data\edgar_documents\TMO\DEF-14A_2025-04-08: File format not allowed: data\edgar_documents\TMO\DEF-14A_2025-04-08
Processed 127 new files. Errors: 8
Found 254 files to process in data\edgar_documents\TMUS


2025-11-14 17:41:51,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:41:54,893 - INFO - Going to convert document batch...
2025-11-14 17:41:54,895 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:41:54,896 - INFO - Processing document 10-K_2023-02-14
2025-11-14 17:42:05,264 - INFO - Finished converting document 10-K_2023-02-14 in 13.69 sec.
2025-11-14 17:42:09,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-K_2023-02-14' --> 'data\processed_data\TMUS\10-K_2023-02-14.md'


2025-11-14 17:42:13,891 - INFO - Going to convert document batch...
2025-11-14 17:42:13,893 - INFO - Processing document 10-K_2024-02-02
2025-11-14 17:42:25,443 - INFO - Finished converting document 10-K_2024-02-02 in 15.56 sec.
2025-11-14 17:42:29,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-K_2024-02-02' --> 'data\processed_data\TMUS\10-K_2024-02-02.md'


2025-11-14 17:42:33,780 - INFO - Going to convert document batch...
2025-11-14 17:42:33,782 - INFO - Processing document 10-K_2025-01-31
2025-11-14 17:42:46,882 - INFO - Finished converting document 10-K_2025-01-31 in 17.81 sec.
2025-11-14 17:42:50,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-K_2025-01-31' --> 'data\processed_data\TMUS\10-K_2025-01-31.md'


2025-11-14 17:42:52,488 - INFO - Going to convert document batch...
2025-11-14 17:42:52,490 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:42:57,662 - INFO - Finished converting document 10-Q_2023-04-27 in 7.03 sec.
2025-11-14 17:42:59,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2023-04-27' --> 'data\processed_data\TMUS\10-Q_2023-04-27.md'


2025-11-14 17:43:01,606 - INFO - Going to convert document batch...
2025-11-14 17:43:01,607 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 17:43:07,454 - INFO - Finished converting document 10-Q_2023-07-27 in 7.83 sec.
2025-11-14 17:43:10,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2023-07-27' --> 'data\processed_data\TMUS\10-Q_2023-07-27.md'


2025-11-14 17:43:13,422 - INFO - Going to convert document batch...
2025-11-14 17:43:13,423 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 17:43:18,023 - INFO - Finished converting document 10-Q_2023-10-25 in 7.89 sec.
2025-11-14 17:43:20,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2023-10-25' --> 'data\processed_data\TMUS\10-Q_2023-10-25.md'


2025-11-14 17:43:23,276 - INFO - Going to convert document batch...
2025-11-14 17:43:23,277 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 17:43:27,017 - INFO - Finished converting document 10-Q_2024-04-26 in 6.25 sec.
2025-11-14 17:43:29,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2024-04-26' --> 'data\processed_data\TMUS\10-Q_2024-04-26.md'


2025-11-14 17:43:32,846 - INFO - Going to convert document batch...
2025-11-14 17:43:32,848 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 17:43:37,432 - INFO - Finished converting document 10-Q_2024-07-31 in 7.50 sec.
2025-11-14 17:43:40,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2024-07-31' --> 'data\processed_data\TMUS\10-Q_2024-07-31.md'


2025-11-14 17:43:43,293 - INFO - Going to convert document batch...
2025-11-14 17:43:43,295 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 17:43:48,212 - INFO - Finished converting document 10-Q_2024-10-23 in 8.27 sec.
2025-11-14 17:43:52,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2024-10-23' --> 'data\processed_data\TMUS\10-Q_2024-10-23.md'


2025-11-14 17:43:54,181 - INFO - Going to convert document batch...
2025-11-14 17:43:54,184 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:43:59,124 - INFO - Finished converting document 10-Q_2025-04-24 in 6.98 sec.
2025-11-14 17:44:01,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2025-04-24' --> 'data\processed_data\TMUS\10-Q_2025-04-24.md'


2025-11-14 17:44:03,885 - INFO - Going to convert document batch...
2025-11-14 17:44:03,886 - INFO - Processing document 10-Q_2025-07-23
2025-11-14 17:44:07,816 - INFO - Finished converting document 10-Q_2025-07-23 in 6.66 sec.
2025-11-14 17:44:09,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\10-Q_2025-07-23' --> 'data\processed_data\TMUS\10-Q_2025-07-23.md'


2025-11-14 17:44:12,942 - INFO - Going to convert document batch...
2025-11-14 17:44:12,944 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 17:44:18,400 - INFO - Finished converting document 10-Q_2025-10-23 in 8.52 sec.
2025-11-14 17:44:22,460 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:22,461 - ERROR - Input document 4_2023-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:22,465 - INFO - Going to convert document batch...
2025-11-14 17:44:22,49

Converted 'data\edgar_documents\TMUS\10-Q_2025-10-23' --> 'data\processed_data\TMUS\10-Q_2025-10-23.md'
Error processing data\edgar_documents\TMUS\4_2023-02-06: File format not allowed: data\edgar_documents\TMUS\4_2023-02-06
Error processing data\edgar_documents\TMUS\4_2023-02-08: File format not allowed: data\edgar_documents\TMUS\4_2023-02-08


2025-11-14 17:44:22,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:22,774 - INFO - Going to convert document batch...
2025-11-14 17:44:22,776 - INFO - Processing document 4_2023-02-22
2025-11-14 17:44:22,861 - INFO - Finished converting document 4_2023-02-22 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2023-02-17' --> 'data\processed_data\TMUS\4_2023-02-17.md'


2025-11-14 17:44:22,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:22,966 - INFO - Going to convert document batch...
2025-11-14 17:44:22,968 - INFO - Processing document 4_2023-02-24
2025-11-14 17:44:23,031 - INFO - Finished converting document 4_2023-02-24 in 0.11 sec.
2025-11-14 17:44:23,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2023-02-22' --> 'data\processed_data\TMUS\4_2023-02-22.md'
Converted 'data\edgar_documents\TMUS\4_2023-02-24' --> 'data\processed_data\TMUS\4_2023-02-24.md'


2025-11-14 17:44:23,142 - INFO - Going to convert document batch...
2025-11-14 17:44:23,144 - INFO - Processing document 4_2023-03-01
2025-11-14 17:44:23,183 - INFO - Finished converting document 4_2023-03-01 in 0.11 sec.
2025-11-14 17:44:23,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:23,276 - INFO - Going to convert document batch...
2025-11-14 17:44:23,278 - INFO - Processing document 4_2023-03-07
2025-11-14 17:44:23,313 - INFO - Finished converting document 4_2023-03-07 in 0.08 sec.
2025-11-14 17:44:23,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:23,400 - INFO - Going to convert document batch...
2025-11-14 17:44:23,403 - INFO - Processing document 4_2023-03-15


Converted 'data\edgar_documents\TMUS\4_2023-03-01' --> 'data\processed_data\TMUS\4_2023-03-01.md'
Converted 'data\edgar_documents\TMUS\4_2023-03-07' --> 'data\processed_data\TMUS\4_2023-03-07.md'


2025-11-14 17:44:23,464 - INFO - Finished converting document 4_2023-03-15 in 0.12 sec.
2025-11-14 17:44:23,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:23,582 - INFO - Going to convert document batch...
2025-11-14 17:44:23,584 - INFO - Processing document 4_2023-04-04
2025-11-14 17:44:23,629 - INFO - Finished converting document 4_2023-04-04 in 0.09 sec.


Converted 'data\edgar_documents\TMUS\4_2023-03-15' --> 'data\processed_data\TMUS\4_2023-03-15.md'
Converted 'data\edgar_documents\TMUS\4_2023-04-04' --> 'data\processed_data\TMUS\4_2023-04-04.md'


2025-11-14 17:44:23,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:23,747 - INFO - Going to convert document batch...
2025-11-14 17:44:23,749 - INFO - Processing document 4_2023-04-07
2025-11-14 17:44:23,827 - INFO - Finished converting document 4_2023-04-07 in 0.14 sec.
2025-11-14 17:44:23,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:23,956 - INFO - Going to convert document batch...
2025-11-14 17:44:23,959 - INFO - Processing document 4_2023-04-12
2025-11-14 17:44:24,027 - INFO - Finished converting document 4_2023-04-12 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2023-04-07' --> 'data\processed_data\TMUS\4_2023-04-07.md'
Converted 'data\edgar_documents\TMUS\4_2023-04-12' --> 'data\processed_data\TMUS\4_2023-04-12.md'


2025-11-14 17:44:24,194 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:24,196 - ERROR - Input document 4_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:24,199 - INFO - Going to convert document batch...
2025-11-14 17:44:24,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:24,252 - INFO - Going to convert document batch...
2025-11-14 17:44:24,254 - INFO - Processing document 4_2023-05-09
2025-11-14 17:44:24,327 - INFO - Fin

Error processing data\edgar_documents\TMUS\4_2023-05-08: File format not allowed: data\edgar_documents\TMUS\4_2023-05-08
Converted 'data\edgar_documents\TMUS\4_2023-05-09' --> 'data\processed_data\TMUS\4_2023-05-09.md'


2025-11-14 17:44:24,413 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:24,414 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:24,416 - INFO - Going to convert document batch...
2025-11-14 17:44:24,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:24,448 - INFO - Going to convert document batch...
2025-11-14 17:44:24,450 - INFO - Processing document 4_2023-05-15
2025-11-14 17:44:24,487 - INFO - Fin

Error processing data\edgar_documents\TMUS\4_2023-05-10: File format not allowed: data\edgar_documents\TMUS\4_2023-05-10
Converted 'data\edgar_documents\TMUS\4_2023-05-15' --> 'data\processed_data\TMUS\4_2023-05-15.md'


2025-11-14 17:44:24,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:24,763 - INFO - Going to convert document batch...
2025-11-14 17:44:24,765 - INFO - Processing document 4_2023-05-23
2025-11-14 17:44:24,818 - INFO - Finished converting document 4_2023-05-23 in 0.09 sec.
2025-11-14 17:44:24,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2023-05-17' --> 'data\processed_data\TMUS\4_2023-05-17.md'
Converted 'data\edgar_documents\TMUS\4_2023-05-23' --> 'data\processed_data\TMUS\4_2023-05-23.md'


2025-11-14 17:44:24,945 - INFO - Going to convert document batch...
2025-11-14 17:44:24,947 - INFO - Processing document 4_2023-05-31
2025-11-14 17:44:25,020 - INFO - Finished converting document 4_2023-05-31 in 0.12 sec.
2025-11-14 17:44:25,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,132 - INFO - Going to convert document batch...
2025-11-14 17:44:25,133 - INFO - Processing document 4_2023-06-14
2025-11-14 17:44:25,176 - INFO - Finished converting document 4_2023-06-14 in 0.08 sec.
2025-11-14 17:44:25,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,276 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\4_2023-05-31' --> 'data\processed_data\TMUS\4_2023-05-31.md'
Converted 'data\edgar_documents\TMUS\4_2023-06-14' --> 'data\processed_data\TMUS\4_2023-06-14.md'


2025-11-14 17:44:25,277 - INFO - Processing document 4_2023-06-21
2025-11-14 17:44:25,319 - INFO - Finished converting document 4_2023-06-21 in 0.09 sec.
2025-11-14 17:44:25,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,398 - INFO - Going to convert document batch...
2025-11-14 17:44:25,400 - INFO - Processing document 4_2023-07-05
2025-11-14 17:44:25,443 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 17:44:25,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,527 - INFO - Going to convert document batch...
2025-11-14 17:44:25,529 - INFO - Processing document 4_2023-07-12
2025-11-14 17:44:25,569 - INFO - Finished converting document 4_2023-07-12 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2023-06-21' --> 'data\processed_data\TMUS\4_2023-06-21.md'
Converted 'data\edgar_documents\TMUS\4_2023-07-05' --> 'data\processed_data\TMUS\4_2023-07-05.md'


2025-11-14 17:44:25,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,677 - INFO - Going to convert document batch...
2025-11-14 17:44:25,682 - INFO - Processing document 4_2023-07-20
2025-11-14 17:44:25,731 - INFO - Finished converting document 4_2023-07-20 in 0.12 sec.
2025-11-14 17:44:25,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,801 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\4_2023-07-12' --> 'data\processed_data\TMUS\4_2023-07-12.md'
Converted 'data\edgar_documents\TMUS\4_2023-07-20' --> 'data\processed_data\TMUS\4_2023-07-20.md'


2025-11-14 17:44:25,802 - INFO - Processing document 4_2023-07-24
2025-11-14 17:44:25,839 - INFO - Finished converting document 4_2023-07-24 in 0.08 sec.
2025-11-14 17:44:25,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:25,910 - INFO - Going to convert document batch...
2025-11-14 17:44:25,911 - INFO - Processing document 4_2023-08-14
2025-11-14 17:44:25,952 - INFO - Finished converting document 4_2023-08-14 in 0.08 sec.
2025-11-14 17:44:26,028 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:26,029 - ERROR - Input document 4_2023-09-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\TMUS\4_2023-07-24' --> 'data\processed_data\TMUS\4_2023-07-24.md'
Converted 'data\edgar_documents\TMUS\4_2023-08-14' --> 'data\processed_data\TMUS\4_2023-08-14.md'
Error processing data\edgar_documents\TMUS\4_2023-09-11: File format not allowed: data\edgar_documents\TMUS\4_2023-09-11


2025-11-14 17:44:26,071 - INFO - Processing document 4_2023-09-13
2025-11-14 17:44:26,111 - INFO - Finished converting document 4_2023-09-13 in 0.08 sec.
2025-11-14 17:44:26,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,183 - INFO - Going to convert document batch...
2025-11-14 17:44:26,185 - INFO - Processing document 4_2023-09-15
2025-11-14 17:44:26,221 - INFO - Finished converting document 4_2023-09-15 in 0.06 sec.
2025-11-14 17:44:26,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,286 - INFO - Going to convert document batch...
2025-11-14 17:44:26,287 - INFO - Processing document 4_2023-11-03
2025-11-14 17:44:26,327 - INFO - Finished converting document 4_2023-11-03 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2023-09-13' --> 'data\processed_data\TMUS\4_2023-09-13.md'
Converted 'data\edgar_documents\TMUS\4_2023-09-15' --> 'data\processed_data\TMUS\4_2023-09-15.md'


2025-11-14 17:44:26,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,390 - INFO - Going to convert document batch...
2025-11-14 17:44:26,391 - INFO - Processing document 4_2023-11-14
2025-11-14 17:44:26,432 - INFO - Finished converting document 4_2023-11-14 in 0.08 sec.
2025-11-14 17:44:26,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,511 - INFO - Going to convert document batch...
2025-11-14 17:44:26,512 - INFO - Processing document 4_2023-11-21
2025-11-14 17:44:26,543 - INFO - Finished converting document 4_2023-11-21 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2023-11-03' --> 'data\processed_data\TMUS\4_2023-11-03.md'
Converted 'data\edgar_documents\TMUS\4_2023-11-14' --> 'data\processed_data\TMUS\4_2023-11-14.md'


2025-11-14 17:44:26,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,614 - INFO - Going to convert document batch...
2025-11-14 17:44:26,615 - INFO - Processing document 4_2023-11-28
2025-11-14 17:44:26,660 - INFO - Finished converting document 4_2023-11-28 in 0.08 sec.
2025-11-14 17:44:26,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,739 - INFO - Going to convert document batch...
2025-11-14 17:44:26,742 - INFO - Processing document 4_2023-12-13
2025-11-14 17:44:26,781 - INFO - Finished converting document 4_2023-12-13 in 0.09 sec.


Converted 'data\edgar_documents\TMUS\4_2023-11-21' --> 'data\processed_data\TMUS\4_2023-11-21.md'
Converted 'data\edgar_documents\TMUS\4_2023-11-28' --> 'data\processed_data\TMUS\4_2023-11-28.md'


2025-11-14 17:44:26,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:26,861 - INFO - Going to convert document batch...
2025-11-14 17:44:26,863 - INFO - Processing document 4_2023-12-15
2025-11-14 17:44:26,962 - INFO - Finished converting document 4_2023-12-15 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2023-12-13' --> 'data\processed_data\TMUS\4_2023-12-13.md'


2025-11-14 17:44:27,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:27,114 - INFO - Going to convert document batch...
2025-11-14 17:44:27,115 - INFO - Processing document 4_2024-01-04
2025-11-14 17:44:27,205 - INFO - Finished converting document 4_2024-01-04 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2023-12-15' --> 'data\processed_data\TMUS\4_2023-12-15.md'


2025-11-14 17:44:27,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:27,370 - INFO - Going to convert document batch...
2025-11-14 17:44:27,372 - INFO - Processing document 4_2024-01-09


Converted 'data\edgar_documents\TMUS\4_2024-01-04' --> 'data\processed_data\TMUS\4_2024-01-04.md'


2025-11-14 17:44:27,534 - INFO - Finished converting document 4_2024-01-09 in 0.25 sec.
2025-11-14 17:44:27,640 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:27,641 - ERROR - Input document 4_2024-01-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:27,643 - INFO - Going to convert document batch...
2025-11-14 17:44:27,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:27,694 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\TMUS\4_2024-01-09' --> 'data\processed_data\TMUS\4_2024-01-09.md'
Error processing data\edgar_documents\TMUS\4_2024-01-11: File format not allowed: data\edgar_documents\TMUS\4_2024-01-11


2025-11-14 17:44:27,793 - INFO - Finished converting document 4_2024-01-12 in 0.16 sec.
2025-11-14 17:44:27,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:27,937 - INFO - Going to convert document batch...
2025-11-14 17:44:27,939 - INFO - Processing document 4_2024-01-18
2025-11-14 17:44:28,063 - INFO - Finished converting document 4_2024-01-18 in 0.20 sec.


Converted 'data\edgar_documents\TMUS\4_2024-01-12' --> 'data\processed_data\TMUS\4_2024-01-12.md'


2025-11-14 17:44:28,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:28,223 - INFO - Going to convert document batch...
2025-11-14 17:44:28,225 - INFO - Processing document 4_2024-01-23


Converted 'data\edgar_documents\TMUS\4_2024-01-18' --> 'data\processed_data\TMUS\4_2024-01-18.md'


2025-11-14 17:44:28,345 - INFO - Finished converting document 4_2024-01-23 in 0.20 sec.
2025-11-14 17:44:28,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:28,581 - INFO - Going to convert document batch...
2025-11-14 17:44:28,584 - INFO - Processing document 4_2024-01-26


Converted 'data\edgar_documents\TMUS\4_2024-01-23' --> 'data\processed_data\TMUS\4_2024-01-23.md'


2025-11-14 17:44:28,714 - INFO - Finished converting document 4_2024-01-26 in 0.30 sec.
2025-11-14 17:44:28,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:28,844 - INFO - Going to convert document batch...
2025-11-14 17:44:28,845 - INFO - Processing document 4_2024-01-30


Converted 'data\edgar_documents\TMUS\4_2024-01-26' --> 'data\processed_data\TMUS\4_2024-01-26.md'


2025-11-14 17:44:29,027 - INFO - Finished converting document 4_2024-01-30 in 0.25 sec.
2025-11-14 17:44:29,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:29,249 - INFO - Going to convert document batch...
2025-11-14 17:44:29,250 - INFO - Processing document 4_2024-02-02
2025-11-14 17:44:29,349 - INFO - Finished converting document 4_2024-02-02 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2024-01-30' --> 'data\processed_data\TMUS\4_2024-01-30.md'


2025-11-14 17:44:29,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:29,467 - INFO - Going to convert document batch...
2025-11-14 17:44:29,469 - INFO - Processing document 4_2024-02-06
2025-11-14 17:44:29,559 - INFO - Finished converting document 4_2024-02-06 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-02-02' --> 'data\processed_data\TMUS\4_2024-02-02.md'


2025-11-14 17:44:29,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:29,670 - INFO - Going to convert document batch...
2025-11-14 17:44:29,672 - INFO - Processing document 4_2024-02-07
2025-11-14 17:44:29,746 - INFO - Finished converting document 4_2024-02-07 in 0.12 sec.
2025-11-14 17:44:29,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2024-02-06' --> 'data\processed_data\TMUS\4_2024-02-06.md'
Converted 'data\edgar_documents\TMUS\4_2024-02-07' --> 'data\processed_data\TMUS\4_2024-02-07.md'


2025-11-14 17:44:29,865 - INFO - Going to convert document batch...
2025-11-14 17:44:29,866 - INFO - Processing document 4_2024-02-09
2025-11-14 17:44:29,987 - INFO - Finished converting document 4_2024-02-09 in 0.19 sec.
2025-11-14 17:44:30,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:30,131 - INFO - Going to convert document batch...
2025-11-14 17:44:30,132 - INFO - Processing document 4_2024-02-13
2025-11-14 17:44:30,242 - INFO - Finished converting document 4_2024-02-13 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2024-02-09' --> 'data\processed_data\TMUS\4_2024-02-09.md'


2025-11-14 17:44:30,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:30,413 - INFO - Going to convert document batch...
2025-11-14 17:44:30,414 - INFO - Processing document 4_2024-02-16
2025-11-14 17:44:30,511 - INFO - Finished converting document 4_2024-02-16 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2024-02-13' --> 'data\processed_data\TMUS\4_2024-02-13.md'


2025-11-14 17:44:30,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:30,623 - INFO - Going to convert document batch...
2025-11-14 17:44:30,624 - INFO - Processing document 4_2024-02-20
2025-11-14 17:44:30,721 - INFO - Finished converting document 4_2024-02-20 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-02-16' --> 'data\processed_data\TMUS\4_2024-02-16.md'


2025-11-14 17:44:30,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:30,854 - INFO - Going to convert document batch...
2025-11-14 17:44:30,855 - INFO - Processing document 4_2024-02-23
2025-11-14 17:44:30,935 - INFO - Finished converting document 4_2024-02-23 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-02-20' --> 'data\processed_data\TMUS\4_2024-02-20.md'


2025-11-14 17:44:31,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:31,129 - INFO - Going to convert document batch...
2025-11-14 17:44:31,131 - INFO - Processing document 4_2024-02-27


Converted 'data\edgar_documents\TMUS\4_2024-02-23' --> 'data\processed_data\TMUS\4_2024-02-23.md'


2025-11-14 17:44:32,542 - INFO - Finished converting document 4_2024-02-27 in 1.50 sec.
2025-11-14 17:44:32,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:32,691 - INFO - Going to convert document batch...
2025-11-14 17:44:32,692 - INFO - Processing document 4_2024-02-29
2025-11-14 17:44:32,733 - INFO - Finished converting document 4_2024-02-29 in 0.08 sec.
2025-11-14 17:44:32,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:32,817 - INFO - Going to convert document batch...
2025-11-14 17:44:32,818 - INFO - Processing document 4_2024-03-01


Converted 'data\edgar_documents\TMUS\4_2024-02-27' --> 'data\processed_data\TMUS\4_2024-02-27.md'
Converted 'data\edgar_documents\TMUS\4_2024-02-29' --> 'data\processed_data\TMUS\4_2024-02-29.md'


2025-11-14 17:44:32,937 - INFO - Finished converting document 4_2024-03-01 in 0.17 sec.
2025-11-14 17:44:33,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:33,050 - INFO - Going to convert document batch...
2025-11-14 17:44:33,051 - INFO - Processing document 4_2024-03-05
2025-11-14 17:44:33,142 - INFO - Finished converting document 4_2024-03-05 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-03-01' --> 'data\processed_data\TMUS\4_2024-03-01.md'


2025-11-14 17:44:33,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:33,288 - INFO - Going to convert document batch...
2025-11-14 17:44:33,289 - INFO - Processing document 4_2024-03-06
2025-11-14 17:44:33,345 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 17:44:33,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2024-03-05' --> 'data\processed_data\TMUS\4_2024-03-05.md'
Converted 'data\edgar_documents\TMUS\4_2024-03-06' --> 'data\processed_data\TMUS\4_2024-03-06.md'


2025-11-14 17:44:33,441 - INFO - Going to convert document batch...
2025-11-14 17:44:33,443 - INFO - Processing document 4_2024-03-08
2025-11-14 17:44:33,536 - INFO - Finished converting document 4_2024-03-08 in 0.14 sec.
2025-11-14 17:44:33,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:33,658 - INFO - Going to convert document batch...
2025-11-14 17:44:33,659 - INFO - Processing document 4_2024-03-11


Converted 'data\edgar_documents\TMUS\4_2024-03-08' --> 'data\processed_data\TMUS\4_2024-03-08.md'


2025-11-14 17:44:33,800 - INFO - Finished converting document 4_2024-03-11 in 0.19 sec.
2025-11-14 17:44:33,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:33,994 - INFO - Going to convert document batch...
2025-11-14 17:44:33,995 - INFO - Processing document 4_2024-03-14
2025-11-14 17:44:34,111 - INFO - Finished converting document 4_2024-03-14 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2024-03-11' --> 'data\processed_data\TMUS\4_2024-03-11.md'


2025-11-14 17:44:34,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:34,265 - INFO - Going to convert document batch...
2025-11-14 17:44:34,267 - INFO - Processing document 4_2024-03-19


Converted 'data\edgar_documents\TMUS\4_2024-03-14' --> 'data\processed_data\TMUS\4_2024-03-14.md'


2025-11-14 17:44:34,389 - INFO - Finished converting document 4_2024-03-19 in 0.20 sec.
2025-11-14 17:44:34,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:34,540 - INFO - Going to convert document batch...
2025-11-14 17:44:34,541 - INFO - Processing document 4_2024-03-21
2025-11-14 17:44:34,642 - INFO - Finished converting document 4_2024-03-21 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2024-03-19' --> 'data\processed_data\TMUS\4_2024-03-19.md'


2025-11-14 17:44:34,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:34,885 - INFO - Going to convert document batch...
2025-11-14 17:44:34,889 - INFO - Processing document 4_2024-03-26


Converted 'data\edgar_documents\TMUS\4_2024-03-21' --> 'data\processed_data\TMUS\4_2024-03-21.md'


2025-11-14 17:44:35,011 - INFO - Finished converting document 4_2024-03-26 in 0.28 sec.
2025-11-14 17:44:35,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:35,127 - INFO - Going to convert document batch...
2025-11-14 17:44:35,128 - INFO - Processing document 4_2024-03-28
2025-11-14 17:44:35,254 - INFO - Finished converting document 4_2024-03-28 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2024-03-26' --> 'data\processed_data\TMUS\4_2024-03-26.md'


2025-11-14 17:44:35,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:35,389 - INFO - Going to convert document batch...
2025-11-14 17:44:35,390 - INFO - Processing document 4_2024-04-02
2025-11-14 17:44:35,471 - INFO - Finished converting document 4_2024-04-02 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-03-28' --> 'data\processed_data\TMUS\4_2024-03-28.md'


2025-11-14 17:44:35,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:35,625 - INFO - Going to convert document batch...
2025-11-14 17:44:35,626 - INFO - Processing document 4_2024-04-04
2025-11-14 17:44:35,736 - INFO - Finished converting document 4_2024-04-04 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2024-04-02' --> 'data\processed_data\TMUS\4_2024-04-02.md'


2025-11-14 17:44:35,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:35,895 - INFO - Going to convert document batch...
2025-11-14 17:44:35,896 - INFO - Processing document 4_2024-04-09
2025-11-14 17:44:35,982 - INFO - Finished converting document 4_2024-04-09 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-04-04' --> 'data\processed_data\TMUS\4_2024-04-04.md'


2025-11-14 17:44:36,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:36,162 - INFO - Going to convert document batch...
2025-11-14 17:44:36,163 - INFO - Processing document 4_2024-04-11


Converted 'data\edgar_documents\TMUS\4_2024-04-09' --> 'data\processed_data\TMUS\4_2024-04-09.md'


2025-11-14 17:44:36,384 - INFO - Finished converting document 4_2024-04-11 in 0.30 sec.
2025-11-14 17:44:36,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:36,502 - INFO - Going to convert document batch...
2025-11-14 17:44:36,503 - INFO - Processing document 4_2024-04-16
2025-11-14 17:44:36,624 - INFO - Finished converting document 4_2024-04-16 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2024-04-11' --> 'data\processed_data\TMUS\4_2024-04-11.md'


2025-11-14 17:44:36,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:36,754 - INFO - Going to convert document batch...
2025-11-14 17:44:36,755 - INFO - Processing document 4_2024-04-18
2025-11-14 17:44:36,828 - INFO - Finished converting document 4_2024-04-18 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-04-16' --> 'data\processed_data\TMUS\4_2024-04-16.md'


2025-11-14 17:44:36,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:37,000 - INFO - Going to convert document batch...
2025-11-14 17:44:37,002 - INFO - Processing document 4_2024-04-23


Converted 'data\edgar_documents\TMUS\4_2024-04-18' --> 'data\processed_data\TMUS\4_2024-04-18.md'


2025-11-14 17:44:37,143 - INFO - Finished converting document 4_2024-04-23 in 0.22 sec.
2025-11-14 17:44:37,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:37,301 - INFO - Going to convert document batch...
2025-11-14 17:44:37,302 - INFO - Processing document 4_2024-04-26


Converted 'data\edgar_documents\TMUS\4_2024-04-23' --> 'data\processed_data\TMUS\4_2024-04-23.md'


2025-11-14 17:44:37,425 - INFO - Finished converting document 4_2024-04-26 in 0.19 sec.
2025-11-14 17:44:37,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:37,640 - INFO - Going to convert document batch...
2025-11-14 17:44:37,642 - INFO - Processing document 4_2024-04-30


Converted 'data\edgar_documents\TMUS\4_2024-04-26' --> 'data\processed_data\TMUS\4_2024-04-26.md'


2025-11-14 17:44:37,784 - INFO - Finished converting document 4_2024-04-30 in 0.23 sec.
2025-11-14 17:44:37,938 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:37,939 - ERROR - Input document 4_2024-05-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:37,941 - INFO - Going to convert document batch...
2025-11-14 17:44:37,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:37,994 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\TMUS\4_2024-04-30' --> 'data\processed_data\TMUS\4_2024-04-30.md'
Error processing data\edgar_documents\TMUS\4_2024-05-02: File format not allowed: data\edgar_documents\TMUS\4_2024-05-02


2025-11-14 17:44:38,126 - INFO - Finished converting document 4_2024-05-03 in 0.19 sec.
2025-11-14 17:44:38,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:38,330 - INFO - Going to convert document batch...
2025-11-14 17:44:38,337 - INFO - Processing document 4_2024-05-07


Converted 'data\edgar_documents\TMUS\4_2024-05-03' --> 'data\processed_data\TMUS\4_2024-05-03.md'


2025-11-14 17:44:38,494 - INFO - Finished converting document 4_2024-05-07 in 0.23 sec.
2025-11-14 17:44:38,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:38,688 - INFO - Going to convert document batch...
2025-11-14 17:44:38,689 - INFO - Processing document 4_2024-05-09


Converted 'data\edgar_documents\TMUS\4_2024-05-07' --> 'data\processed_data\TMUS\4_2024-05-07.md'


2025-11-14 17:44:39,396 - INFO - Finished converting document 4_2024-05-09 in 0.77 sec.
2025-11-14 17:44:39,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:39,553 - INFO - Going to convert document batch...
2025-11-14 17:44:39,554 - INFO - Processing document 4_2024-05-14
2025-11-14 17:44:39,647 - INFO - Finished converting document 4_2024-05-14 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-05-09' --> 'data\processed_data\TMUS\4_2024-05-09.md'


2025-11-14 17:44:39,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:39,805 - INFO - Going to convert document batch...
2025-11-14 17:44:39,806 - INFO - Processing document 4_2024-05-15
2025-11-14 17:44:39,899 - INFO - Finished converting document 4_2024-05-15 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-05-14' --> 'data\processed_data\TMUS\4_2024-05-14.md'
Converted 'data\edgar_documents\TMUS\4_2024-05-15' --> 'data\processed_data\TMUS\4_2024-05-15.md'


2025-11-14 17:44:39,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:40,028 - INFO - Going to convert document batch...
2025-11-14 17:44:40,029 - INFO - Processing document 4_2024-05-16
2025-11-14 17:44:40,108 - INFO - Finished converting document 4_2024-05-16 in 0.16 sec.
2025-11-14 17:44:40,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:40,202 - INFO - Going to convert document batch...
2025-11-14 17:44:40,204 - INFO - Processing document 4_2024-05-17
2025-11-14 17:44:40,243 - INFO - Finished converting document 4_2024-05-17 in 0.06 sec.
2025-11-14 17:44:40,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:40,344 - INFO - Going to convert document batch...
2025-11-14 17:44:40,347 - INFO - Processing document 4_2024-05-21


Converted 'data\edgar_documents\TMUS\4_2024-05-16' --> 'data\processed_data\TMUS\4_2024-05-16.md'
Converted 'data\edgar_documents\TMUS\4_2024-05-17' --> 'data\processed_data\TMUS\4_2024-05-17.md'


2025-11-14 17:44:40,484 - INFO - Finished converting document 4_2024-05-21 in 0.20 sec.
2025-11-14 17:44:40,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:40,608 - INFO - Going to convert document batch...
2025-11-14 17:44:40,609 - INFO - Processing document 4_2024-05-23
2025-11-14 17:44:40,700 - INFO - Finished converting document 4_2024-05-23 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2024-05-21' --> 'data\processed_data\TMUS\4_2024-05-21.md'
Converted 'data\edgar_documents\TMUS\4_2024-05-23' --> 'data\processed_data\TMUS\4_2024-05-23.md'


2025-11-14 17:44:40,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:40,820 - INFO - Going to convert document batch...
2025-11-14 17:44:40,821 - INFO - Processing document 4_2024-05-28
2025-11-14 17:44:40,936 - INFO - Finished converting document 4_2024-05-28 in 0.17 sec.
2025-11-14 17:44:41,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:41,062 - INFO - Going to convert document batch...
2025-11-14 17:44:41,063 - INFO - Processing document 4_2024-05-30
2025-11-14 17:44:41,141 - INFO - Finished converting document 4_2024-05-30 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-05-28' --> 'data\processed_data\TMUS\4_2024-05-28.md'


2025-11-14 17:44:41,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:41,271 - INFO - Going to convert document batch...
2025-11-14 17:44:41,272 - INFO - Processing document 4_2024-06-04
2025-11-14 17:44:41,387 - INFO - Finished converting document 4_2024-06-04 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2024-05-30' --> 'data\processed_data\TMUS\4_2024-05-30.md'


2025-11-14 17:44:41,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:41,603 - INFO - Going to convert document batch...
2025-11-14 17:44:41,604 - INFO - Processing document 4_2024-06-06


Converted 'data\edgar_documents\TMUS\4_2024-06-04' --> 'data\processed_data\TMUS\4_2024-06-04.md'


2025-11-14 17:44:41,730 - INFO - Finished converting document 4_2024-06-06 in 0.23 sec.
2025-11-14 17:44:41,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:41,874 - INFO - Going to convert document batch...
2025-11-14 17:44:41,877 - INFO - Processing document 4_2024-06-07
2025-11-14 17:44:42,001 - INFO - Finished converting document 4_2024-06-07 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2024-06-06' --> 'data\processed_data\TMUS\4_2024-06-06.md'


2025-11-14 17:44:42,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:42,142 - INFO - Going to convert document batch...
2025-11-14 17:44:42,143 - INFO - Processing document 4_2024-06-11
2025-11-14 17:44:42,236 - INFO - Finished converting document 4_2024-06-11 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2024-06-07' --> 'data\processed_data\TMUS\4_2024-06-07.md'


2025-11-14 17:44:42,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:42,337 - INFO - Going to convert document batch...
2025-11-14 17:44:42,338 - INFO - Processing document 4_2024-06-12
2025-11-14 17:44:42,373 - INFO - Finished converting document 4_2024-06-12 in 0.06 sec.
2025-11-14 17:44:42,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:42,463 - INFO - Going to convert document batch...
2025-11-14 17:44:42,465 - INFO - Processing document 4_2024-06-13


Converted 'data\edgar_documents\TMUS\4_2024-06-11' --> 'data\processed_data\TMUS\4_2024-06-11.md'
Converted 'data\edgar_documents\TMUS\4_2024-06-12' --> 'data\processed_data\TMUS\4_2024-06-12.md'


2025-11-14 17:44:42,570 - INFO - Finished converting document 4_2024-06-13 in 0.16 sec.
2025-11-14 17:44:42,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:42,705 - INFO - Going to convert document batch...
2025-11-14 17:44:42,707 - INFO - Processing document 4_2024-06-17
2025-11-14 17:44:42,791 - INFO - Finished converting document 4_2024-06-17 in 0.12 sec.
2025-11-14 17:44:42,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2024-06-13' --> 'data\processed_data\TMUS\4_2024-06-13.md'
Converted 'data\edgar_documents\TMUS\4_2024-06-17' --> 'data\processed_data\TMUS\4_2024-06-17.md'


2025-11-14 17:44:42,918 - INFO - Going to convert document batch...
2025-11-14 17:44:42,920 - INFO - Processing document 4_2024-06-18
2025-11-14 17:44:43,018 - INFO - Finished converting document 4_2024-06-18 in 0.19 sec.
2025-11-14 17:44:43,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:43,189 - INFO - Going to convert document batch...
2025-11-14 17:44:43,190 - INFO - Processing document 4_2024-06-20
2025-11-14 17:44:43,266 - INFO - Finished converting document 4_2024-06-20 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2024-06-18' --> 'data\processed_data\TMUS\4_2024-06-18.md'


2025-11-14 17:44:43,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:43,487 - INFO - Going to convert document batch...
2025-11-14 17:44:43,489 - INFO - Processing document 4_2024-06-25


Converted 'data\edgar_documents\TMUS\4_2024-06-20' --> 'data\processed_data\TMUS\4_2024-06-20.md'


2025-11-14 17:44:43,599 - INFO - Finished converting document 4_2024-06-25 in 0.22 sec.
2025-11-14 17:44:43,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:43,774 - INFO - Going to convert document batch...
2025-11-14 17:44:43,776 - INFO - Processing document 4_2024-06-28
2025-11-14 17:44:43,869 - INFO - Finished converting document 4_2024-06-28 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2024-06-25' --> 'data\processed_data\TMUS\4_2024-06-25.md'


2025-11-14 17:44:43,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:43,993 - INFO - Going to convert document batch...
2025-11-14 17:44:43,994 - INFO - Processing document 4_2024-07-02
2025-11-14 17:44:44,027 - INFO - Finished converting document 4_2024-07-02 in 0.08 sec.
2025-11-14 17:44:44,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,096 - INFO - Going to convert document batch...
2025-11-14 17:44:44,097 - INFO - Processing document 4_2024-08-02
2025-11-14 17:44:44,138 - INFO - Finished converting document 4_2024-08-02 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2024-06-28' --> 'data\processed_data\TMUS\4_2024-06-28.md'
Converted 'data\edgar_documents\TMUS\4_2024-07-02' --> 'data\processed_data\TMUS\4_2024-07-02.md'


2025-11-14 17:44:44,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,232 - INFO - Going to convert document batch...
2025-11-14 17:44:44,234 - INFO - Processing document 4_2024-08-09
2025-11-14 17:44:44,281 - INFO - Finished converting document 4_2024-08-09 in 0.11 sec.
2025-11-14 17:44:44,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,357 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\4_2024-08-02' --> 'data\processed_data\TMUS\4_2024-08-02.md'
Converted 'data\edgar_documents\TMUS\4_2024-08-09' --> 'data\processed_data\TMUS\4_2024-08-09.md'


2025-11-14 17:44:44,358 - INFO - Processing document 4_2024-08-14
2025-11-14 17:44:44,396 - INFO - Finished converting document 4_2024-08-14 in 0.06 sec.
2025-11-14 17:44:44,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,481 - INFO - Going to convert document batch...
2025-11-14 17:44:44,483 - INFO - Processing document 4_2024-08-21
2025-11-14 17:44:44,519 - INFO - Finished converting document 4_2024-08-21 in 0.06 sec.
2025-11-14 17:44:44,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,588 - INFO - Going to convert document batch...
2025-11-14 17:44:44,589 - INFO - Processing document 4_2024-08-22
2025-11-14 17:44:44,633 - INFO - Finished converting document 4_2024-08-22 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2024-08-14' --> 'data\processed_data\TMUS\4_2024-08-14.md'
Converted 'data\edgar_documents\TMUS\4_2024-08-21' --> 'data\processed_data\TMUS\4_2024-08-21.md'


2025-11-14 17:44:44,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,724 - INFO - Going to convert document batch...
2025-11-14 17:44:44,726 - INFO - Processing document 4_2024-08-27
2025-11-14 17:44:44,786 - INFO - Finished converting document 4_2024-08-27 in 0.11 sec.


Converted 'data\edgar_documents\TMUS\4_2024-08-22' --> 'data\processed_data\TMUS\4_2024-08-22.md'
Converted 'data\edgar_documents\TMUS\4_2024-08-27' --> 'data\processed_data\TMUS\4_2024-08-27.md'


2025-11-14 17:44:44,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:44,937 - INFO - Going to convert document batch...
2025-11-14 17:44:44,939 - INFO - Processing document 4_2024-09-11
2025-11-14 17:44:44,971 - INFO - Finished converting document 4_2024-09-11 in 0.11 sec.
2025-11-14 17:44:45,031 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:45,032 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44

Converted 'data\edgar_documents\TMUS\4_2024-09-11' --> 'data\processed_data\TMUS\4_2024-09-11.md'
Error processing data\edgar_documents\TMUS\4_2024-09-23: File format not allowed: data\edgar_documents\TMUS\4_2024-09-23
Error processing data\edgar_documents\TMUS\4_2024-09-25: File format not allowed: data\edgar_documents\TMUS\4_2024-09-25
Converted 'data\edgar_documents\TMUS\4_2024-10-02' --> 'data\processed_data\TMUS\4_2024-10-02.md'


2025-11-14 17:44:45,206 - INFO - Processing document 4_2024-10-15
2025-11-14 17:44:45,262 - INFO - Finished converting document 4_2024-10-15 in 0.11 sec.
2025-11-14 17:44:45,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:45,339 - INFO - Going to convert document batch...
2025-11-14 17:44:45,340 - INFO - Processing document 4_2024-10-18


Converted 'data\edgar_documents\TMUS\4_2024-10-15' --> 'data\processed_data\TMUS\4_2024-10-15.md'


2025-11-14 17:44:45,724 - INFO - Finished converting document 4_2024-10-18 in 0.41 sec.
2025-11-14 17:44:45,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:45,850 - INFO - Going to convert document batch...
2025-11-14 17:44:45,852 - INFO - Processing document 4_2024-10-29
2025-11-14 17:44:45,923 - INFO - Finished converting document 4_2024-10-29 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-10-18' --> 'data\processed_data\TMUS\4_2024-10-18.md'
Converted 'data\edgar_documents\TMUS\4_2024-10-29' --> 'data\processed_data\TMUS\4_2024-10-29.md'


2025-11-14 17:44:45,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,000 - INFO - Going to convert document batch...
2025-11-14 17:44:46,002 - INFO - Processing document 4_2024-11-06
2025-11-14 17:44:46,051 - INFO - Finished converting document 4_2024-11-06 in 0.09 sec.
2025-11-14 17:44:46,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,129 - INFO - Going to convert document batch...
2025-11-14 17:44:46,130 - INFO - Processing document 4_2024-11-12
2025-11-14 17:44:46,191 - INFO - Finished converting document 4_2024-11-12 in 0.09 sec.
2025-11-14 17:44:46,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,271 - INFO - Going to convert document batch...
2025-11-14 17:44:46,272 - INFO - Processing document 4_2024-11-13


Converted 'data\edgar_documents\TMUS\4_2024-11-06' --> 'data\processed_data\TMUS\4_2024-11-06.md'
Converted 'data\edgar_documents\TMUS\4_2024-11-12' --> 'data\processed_data\TMUS\4_2024-11-12.md'


2025-11-14 17:44:46,311 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 17:44:46,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,424 - INFO - Going to convert document batch...
2025-11-14 17:44:46,425 - INFO - Processing document 4_2024-11-18
2025-11-14 17:44:46,478 - INFO - Finished converting document 4_2024-11-18 in 0.09 sec.
2025-11-14 17:44:46,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2024-11-13' --> 'data\processed_data\TMUS\4_2024-11-13.md'
Converted 'data\edgar_documents\TMUS\4_2024-11-18' --> 'data\processed_data\TMUS\4_2024-11-18.md'


2025-11-14 17:44:46,604 - INFO - Going to convert document batch...
2025-11-14 17:44:46,607 - INFO - Processing document 4_2024-12-02
2025-11-14 17:44:46,668 - INFO - Finished converting document 4_2024-12-02 in 0.14 sec.
2025-11-14 17:44:46,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,744 - INFO - Going to convert document batch...
2025-11-14 17:44:46,745 - INFO - Processing document 4_2024-12-11
2025-11-14 17:44:46,784 - INFO - Finished converting document 4_2024-12-11 in 0.08 sec.
2025-11-14 17:44:46,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:46,868 - INFO - Going to convert document batch...
2025-11-14 17:44:46,870 - INFO - Processing document 4_2024-12-17


Converted 'data\edgar_documents\TMUS\4_2024-12-02' --> 'data\processed_data\TMUS\4_2024-12-02.md'
Converted 'data\edgar_documents\TMUS\4_2024-12-11' --> 'data\processed_data\TMUS\4_2024-12-11.md'


2025-11-14 17:44:46,914 - INFO - Finished converting document 4_2024-12-17 in 0.09 sec.
2025-11-14 17:44:46,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,014 - INFO - Going to convert document batch...
2025-11-14 17:44:47,015 - INFO - Processing document 4_2025-01-03
2025-11-14 17:44:47,064 - INFO - Finished converting document 4_2025-01-03 in 0.12 sec.


Converted 'data\edgar_documents\TMUS\4_2024-12-17' --> 'data\processed_data\TMUS\4_2024-12-17.md'


2025-11-14 17:44:47,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,150 - INFO - Going to convert document batch...
2025-11-14 17:44:47,151 - INFO - Processing document 4_2025-02-04
2025-11-14 17:44:47,184 - INFO - Finished converting document 4_2025-02-04 in 0.06 sec.
2025-11-14 17:44:47,269 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:47,270 - ERROR - Input document 4_2025-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44

Converted 'data\edgar_documents\TMUS\4_2025-01-03' --> 'data\processed_data\TMUS\4_2025-01-03.md'
Converted 'data\edgar_documents\TMUS\4_2025-02-04' --> 'data\processed_data\TMUS\4_2025-02-04.md'
Error processing data\edgar_documents\TMUS\4_2025-02-06: File format not allowed: data\edgar_documents\TMUS\4_2025-02-06


2025-11-14 17:44:47,319 - INFO - Going to convert document batch...
2025-11-14 17:44:47,321 - INFO - Processing document 4_2025-02-19
2025-11-14 17:44:47,384 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 17:44:47,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,506 - INFO - Going to convert document batch...
2025-11-14 17:44:47,507 - INFO - Processing document 4_2025-02-21
2025-11-14 17:44:47,554 - INFO - Finished converting document 4_2025-02-21 in 0.09 sec.
2025-11-14 17:44:47,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,619 - INFO - Going to convert document batch...
2025-11-14 17:44:47,621 - INFO - Processing document 4_2025-02-25


Converted 'data\edgar_documents\TMUS\4_2025-02-19' --> 'data\processed_data\TMUS\4_2025-02-19.md'
Converted 'data\edgar_documents\TMUS\4_2025-02-21' --> 'data\processed_data\TMUS\4_2025-02-21.md'


2025-11-14 17:44:47,692 - INFO - Finished converting document 4_2025-02-25 in 0.09 sec.
2025-11-14 17:44:47,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,785 - INFO - Going to convert document batch...
2025-11-14 17:44:47,786 - INFO - Processing document 4_2025-02-27
2025-11-14 17:44:47,821 - INFO - Finished converting document 4_2025-02-27 in 0.06 sec.
2025-11-14 17:44:47,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:47,895 - INFO - Going to convert document batch...
2025-11-14 17:44:47,896 - INFO - Processing document 4_2025-03-03
2025-11-14 17:44:47,929 - INFO - Finished converting document 4_2025-03-03 in 0.06 sec.


Converted 'data\edgar_documents\TMUS\4_2025-02-25' --> 'data\processed_data\TMUS\4_2025-02-25.md'
Converted 'data\edgar_documents\TMUS\4_2025-02-27' --> 'data\processed_data\TMUS\4_2025-02-27.md'


2025-11-14 17:44:47,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,008 - INFO - Going to convert document batch...
2025-11-14 17:44:48,011 - INFO - Processing document 4_2025-03-04
2025-11-14 17:44:48,048 - INFO - Finished converting document 4_2025-03-04 in 0.09 sec.
2025-11-14 17:44:48,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,153 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\4_2025-03-03' --> 'data\processed_data\TMUS\4_2025-03-03.md'
Converted 'data\edgar_documents\TMUS\4_2025-03-04' --> 'data\processed_data\TMUS\4_2025-03-04.md'


2025-11-14 17:44:48,155 - INFO - Processing document 4_2025-03-06
2025-11-14 17:44:48,207 - INFO - Finished converting document 4_2025-03-06 in 0.11 sec.
2025-11-14 17:44:48,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,274 - INFO - Going to convert document batch...
2025-11-14 17:44:48,275 - INFO - Processing document 4_2025-03-10
2025-11-14 17:44:48,311 - INFO - Finished converting document 4_2025-03-10 in 0.08 sec.
2025-11-14 17:44:48,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,380 - INFO - Going to convert document batch...
2025-11-14 17:44:48,389 - INFO - Processing document 4_2025-03-17


Converted 'data\edgar_documents\TMUS\4_2025-03-06' --> 'data\processed_data\TMUS\4_2025-03-06.md'
Converted 'data\edgar_documents\TMUS\4_2025-03-10' --> 'data\processed_data\TMUS\4_2025-03-10.md'


2025-11-14 17:44:48,433 - INFO - Finished converting document 4_2025-03-17 in 0.09 sec.
2025-11-14 17:44:48,519 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:48,520 - ERROR - Input document 4_2025-03-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:48,522 - INFO - Going to convert document batch...
2025-11-14 17:44:48,551 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:48,552 - ERROR - Input document 4_2025-03-26 with forma

Converted 'data\edgar_documents\TMUS\4_2025-03-17' --> 'data\processed_data\TMUS\4_2025-03-17.md'
Error processing data\edgar_documents\TMUS\4_2025-03-24: File format not allowed: data\edgar_documents\TMUS\4_2025-03-24
Error processing data\edgar_documents\TMUS\4_2025-03-26: File format not allowed: data\edgar_documents\TMUS\4_2025-03-26
Converted 'data\edgar_documents\TMUS\4_2025-04-03' --> 'data\processed_data\TMUS\4_2025-04-03.md'


2025-11-14 17:44:48,693 - INFO - Going to convert document batch...
2025-11-14 17:44:48,694 - INFO - Processing document 4_2025-05-05
2025-11-14 17:44:48,725 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 17:44:48,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,824 - INFO - Going to convert document batch...
2025-11-14 17:44:48,825 - INFO - Processing document 4_2025-05-16
2025-11-14 17:44:48,859 - INFO - Finished converting document 4_2025-05-16 in 0.08 sec.
2025-11-14 17:44:48,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:48,937 - INFO - Going to convert document batch...
2025-11-14 17:44:48,938 - INFO - Processing document 4_2025-05-21
2025-11-14 17:44:48,974 - INFO - Finished converting document 4_2025-05-21 in 0.08 sec.


Converted 'data\edgar_documents\TMUS\4_2025-05-05' --> 'data\processed_data\TMUS\4_2025-05-05.md'
Converted 'data\edgar_documents\TMUS\4_2025-05-16' --> 'data\processed_data\TMUS\4_2025-05-16.md'


2025-11-14 17:44:49,059 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:44:49,059 - ERROR - Input document 4_2025-05-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:44:49,062 - INFO - Going to convert document batch...
2025-11-14 17:44:49,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:49,098 - INFO - Going to convert document batch...
2025-11-14 17:44:49,099 - INFO - Processing document 4_2025-06-10
2025-11-14 17:44:49,137 - INFO - Fin

Converted 'data\edgar_documents\TMUS\4_2025-05-21' --> 'data\processed_data\TMUS\4_2025-05-21.md'
Error processing data\edgar_documents\TMUS\4_2025-05-23: File format not allowed: data\edgar_documents\TMUS\4_2025-05-23
Converted 'data\edgar_documents\TMUS\4_2025-06-10' --> 'data\processed_data\TMUS\4_2025-06-10.md'


2025-11-14 17:44:49,230 - INFO - Going to convert document batch...
2025-11-14 17:44:49,232 - INFO - Processing document 4_2025-06-16
2025-11-14 17:44:49,331 - INFO - Finished converting document 4_2025-06-16 in 0.16 sec.
2025-11-14 17:44:49,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:49,444 - INFO - Going to convert document batch...
2025-11-14 17:44:49,446 - INFO - Processing document 4_2025-06-17
2025-11-14 17:44:49,502 - INFO - Finished converting document 4_2025-06-17 in 0.09 sec.
2025-11-14 17:44:49,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-06-16' --> 'data\processed_data\TMUS\4_2025-06-16.md'
Converted 'data\edgar_documents\TMUS\4_2025-06-17' --> 'data\processed_data\TMUS\4_2025-06-17.md'


2025-11-14 17:44:49,636 - INFO - Going to convert document batch...
2025-11-14 17:44:49,639 - INFO - Processing document 4_2025-06-20
2025-11-14 17:44:49,810 - INFO - Finished converting document 4_2025-06-20 in 0.27 sec.
2025-11-14 17:44:49,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:49,952 - INFO - Going to convert document batch...
2025-11-14 17:44:49,954 - INFO - Processing document 4_2025-06-25


Converted 'data\edgar_documents\TMUS\4_2025-06-20' --> 'data\processed_data\TMUS\4_2025-06-20.md'


2025-11-14 17:44:50,156 - INFO - Finished converting document 4_2025-06-25 in 0.27 sec.
2025-11-14 17:44:50,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:50,370 - INFO - Going to convert document batch...
2025-11-14 17:44:50,372 - INFO - Processing document 4_2025-06-30


Converted 'data\edgar_documents\TMUS\4_2025-06-25' --> 'data\processed_data\TMUS\4_2025-06-25.md'


2025-11-14 17:44:50,482 - INFO - Finished converting document 4_2025-06-30 in 0.20 sec.
2025-11-14 17:44:50,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:50,727 - INFO - Going to convert document batch...
2025-11-14 17:44:50,730 - INFO - Processing document 4_2025-07-03


Converted 'data\edgar_documents\TMUS\4_2025-06-30' --> 'data\processed_data\TMUS\4_2025-06-30.md'


2025-11-14 17:44:50,905 - INFO - Finished converting document 4_2025-07-03 in 0.28 sec.
2025-11-14 17:44:51,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:51,067 - INFO - Going to convert document batch...
2025-11-14 17:44:51,068 - INFO - Processing document 4_2025-07-08
2025-11-14 17:44:51,167 - INFO - Finished converting document 4_2025-07-08 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2025-07-03' --> 'data\processed_data\TMUS\4_2025-07-03.md'


2025-11-14 17:44:51,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:51,303 - INFO - Going to convert document batch...
2025-11-14 17:44:51,304 - INFO - Processing document 4_2025-07-11


Converted 'data\edgar_documents\TMUS\4_2025-07-08' --> 'data\processed_data\TMUS\4_2025-07-08.md'


2025-11-14 17:44:51,477 - INFO - Finished converting document 4_2025-07-11 in 0.24 sec.
2025-11-14 17:44:51,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:51,615 - INFO - Going to convert document batch...
2025-11-14 17:44:51,616 - INFO - Processing document 4_2025-07-16
2025-11-14 17:44:51,734 - INFO - Finished converting document 4_2025-07-16 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2025-07-11' --> 'data\processed_data\TMUS\4_2025-07-11.md'


2025-11-14 17:44:51,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:51,871 - INFO - Going to convert document batch...
2025-11-14 17:44:51,873 - INFO - Processing document 4_2025-07-21
2025-11-14 17:44:51,972 - INFO - Finished converting document 4_2025-07-21 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-07-16' --> 'data\processed_data\TMUS\4_2025-07-16.md'


2025-11-14 17:44:52,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:52,116 - INFO - Going to convert document batch...
2025-11-14 17:44:52,117 - INFO - Processing document 4_2025-07-24


Converted 'data\edgar_documents\TMUS\4_2025-07-21' --> 'data\processed_data\TMUS\4_2025-07-21.md'


2025-11-14 17:44:52,250 - INFO - Finished converting document 4_2025-07-24 in 0.20 sec.
2025-11-14 17:44:52,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:52,392 - INFO - Going to convert document batch...
2025-11-14 17:44:52,394 - INFO - Processing document 4_2025-07-28
2025-11-14 17:44:52,433 - INFO - Finished converting document 4_2025-07-28 in 0.08 sec.
2025-11-14 17:44:52,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-07-24' --> 'data\processed_data\TMUS\4_2025-07-24.md'
Converted 'data\edgar_documents\TMUS\4_2025-07-28' --> 'data\processed_data\TMUS\4_2025-07-28.md'


2025-11-14 17:44:53,029 - INFO - Going to convert document batch...
2025-11-14 17:44:53,032 - INFO - Processing document 4_2025-07-29
2025-11-14 17:44:53,232 - INFO - Finished converting document 4_2025-07-29 in 0.76 sec.
2025-11-14 17:44:53,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:53,400 - INFO - Going to convert document batch...
2025-11-14 17:44:53,402 - INFO - Processing document 4_2025-07-31


Converted 'data\edgar_documents\TMUS\4_2025-07-29' --> 'data\processed_data\TMUS\4_2025-07-29.md'


2025-11-14 17:44:53,522 - INFO - Finished converting document 4_2025-07-31 in 0.20 sec.
2025-11-14 17:44:53,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:53,672 - INFO - Going to convert document batch...
2025-11-14 17:44:53,673 - INFO - Processing document 4_2025-08-05


Converted 'data\edgar_documents\TMUS\4_2025-07-31' --> 'data\processed_data\TMUS\4_2025-07-31.md'


2025-11-14 17:44:53,794 - INFO - Finished converting document 4_2025-08-05 in 0.19 sec.
2025-11-14 17:44:53,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:54,027 - INFO - Going to convert document batch...
2025-11-14 17:44:54,027 - INFO - Processing document 4_2025-08-07


Converted 'data\edgar_documents\TMUS\4_2025-08-05' --> 'data\processed_data\TMUS\4_2025-08-05.md'


2025-11-14 17:44:54,153 - INFO - Finished converting document 4_2025-08-07 in 0.22 sec.
2025-11-14 17:44:54,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:54,395 - INFO - Going to convert document batch...
2025-11-14 17:44:54,398 - INFO - Processing document 4_2025-08-12


Converted 'data\edgar_documents\TMUS\4_2025-08-07' --> 'data\processed_data\TMUS\4_2025-08-07.md'


2025-11-14 17:44:54,538 - INFO - Finished converting document 4_2025-08-12 in 0.23 sec.
2025-11-14 17:44:54,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:54,708 - INFO - Going to convert document batch...
2025-11-14 17:44:54,709 - INFO - Processing document 4_2025-08-15
2025-11-14 17:44:54,804 - INFO - Finished converting document 4_2025-08-15 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-08-12' --> 'data\processed_data\TMUS\4_2025-08-12.md'


2025-11-14 17:44:54,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:55,007 - INFO - Going to convert document batch...
2025-11-14 17:44:55,008 - INFO - Processing document 4_2025-08-19
2025-11-14 17:44:55,060 - INFO - Finished converting document 4_2025-08-19 in 0.09 sec.
2025-11-14 17:44:55,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-08-15' --> 'data\processed_data\TMUS\4_2025-08-15.md'
Converted 'data\edgar_documents\TMUS\4_2025-08-19' --> 'data\processed_data\TMUS\4_2025-08-19.md'


2025-11-14 17:44:55,234 - INFO - Going to convert document batch...
2025-11-14 17:44:55,236 - INFO - Processing document 4_2025-08-20
2025-11-14 17:44:55,368 - INFO - Finished converting document 4_2025-08-20 in 0.25 sec.
2025-11-14 17:44:55,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:55,572 - INFO - Going to convert document batch...
2025-11-14 17:44:55,573 - INFO - Processing document 4_2025-08-25


Converted 'data\edgar_documents\TMUS\4_2025-08-20' --> 'data\processed_data\TMUS\4_2025-08-20.md'


2025-11-14 17:44:55,792 - INFO - Finished converting document 4_2025-08-25 in 0.33 sec.
2025-11-14 17:44:55,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:55,940 - INFO - Going to convert document batch...
2025-11-14 17:44:55,942 - INFO - Processing document 4_2025-08-26
2025-11-14 17:44:55,973 - INFO - Finished converting document 4_2025-08-26 in 0.06 sec.
2025-11-14 17:44:56,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:56,058 - INFO - Going to convert document batch...
2025-11-14 17:44:56,059 - INFO - Processing document 4_2025-08-28


Converted 'data\edgar_documents\TMUS\4_2025-08-25' --> 'data\processed_data\TMUS\4_2025-08-25.md'
Converted 'data\edgar_documents\TMUS\4_2025-08-26' --> 'data\processed_data\TMUS\4_2025-08-26.md'


2025-11-14 17:44:56,205 - INFO - Finished converting document 4_2025-08-28 in 0.20 sec.
2025-11-14 17:44:56,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:56,329 - INFO - Going to convert document batch...
2025-11-14 17:44:56,330 - INFO - Processing document 4_2025-08-29
2025-11-14 17:44:56,447 - INFO - Finished converting document 4_2025-08-29 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-08-28' --> 'data\processed_data\TMUS\4_2025-08-28.md'


2025-11-14 17:44:56,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:56,574 - INFO - Going to convert document batch...
2025-11-14 17:44:56,577 - INFO - Processing document 4_2025-09-03
2025-11-14 17:44:56,624 - INFO - Finished converting document 4_2025-09-03 in 0.11 sec.
2025-11-14 17:44:56,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-08-29' --> 'data\processed_data\TMUS\4_2025-08-29.md'
Converted 'data\edgar_documents\TMUS\4_2025-09-03' --> 'data\processed_data\TMUS\4_2025-09-03.md'


2025-11-14 17:44:56,729 - INFO - Going to convert document batch...
2025-11-14 17:44:56,731 - INFO - Processing document 4_2025-09-04
2025-11-14 17:44:56,919 - INFO - Finished converting document 4_2025-09-04 in 0.27 sec.
2025-11-14 17:44:57,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:57,079 - INFO - Going to convert document batch...
2025-11-14 17:44:57,084 - INFO - Processing document 4_2025-09-08


Converted 'data\edgar_documents\TMUS\4_2025-09-04' --> 'data\processed_data\TMUS\4_2025-09-04.md'


2025-11-14 17:44:57,342 - INFO - Finished converting document 4_2025-09-08 in 0.33 sec.
2025-11-14 17:44:57,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:57,543 - INFO - Going to convert document batch...
2025-11-14 17:44:57,546 - INFO - Processing document 4_2025-09-10
2025-11-14 17:44:57,653 - INFO - Finished converting document 4_2025-09-10 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2025-09-08' --> 'data\processed_data\TMUS\4_2025-09-08.md'


2025-11-14 17:44:57,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-09-10' --> 'data\processed_data\TMUS\4_2025-09-10.md'


2025-11-14 17:44:58,019 - INFO - Going to convert document batch...
2025-11-14 17:44:58,022 - INFO - Processing document 4_2025-09-15
2025-11-14 17:44:58,091 - INFO - Finished converting document 4_2025-09-15 in 0.30 sec.
2025-11-14 17:44:58,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:58,212 - INFO - Going to convert document batch...
2025-11-14 17:44:58,213 - INFO - Processing document 4_2025-09-17
2025-11-14 17:44:58,317 - INFO - Finished converting document 4_2025-09-17 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2025-09-15' --> 'data\processed_data\TMUS\4_2025-09-15.md'


2025-11-14 17:44:58,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:58,472 - INFO - Going to convert document batch...
2025-11-14 17:44:58,473 - INFO - Processing document 4_2025-09-22
2025-11-14 17:44:58,584 - INFO - Finished converting document 4_2025-09-22 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\4_2025-09-17' --> 'data\processed_data\TMUS\4_2025-09-17.md'


2025-11-14 17:44:58,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:58,756 - INFO - Going to convert document batch...
2025-11-14 17:44:58,758 - INFO - Processing document 4_2025-09-23
2025-11-14 17:44:58,830 - INFO - Finished converting document 4_2025-09-23 in 0.11 sec.


Converted 'data\edgar_documents\TMUS\4_2025-09-22' --> 'data\processed_data\TMUS\4_2025-09-22.md'
Converted 'data\edgar_documents\TMUS\4_2025-09-23' --> 'data\processed_data\TMUS\4_2025-09-23.md'


2025-11-14 17:44:58,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:58,969 - INFO - Going to convert document batch...
2025-11-14 17:44:58,971 - INFO - Processing document 4_2025-09-24
2025-11-14 17:44:59,075 - INFO - Finished converting document 4_2025-09-24 in 0.19 sec.
2025-11-14 17:44:59,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:44:59,207 - INFO - Going to convert document batch...
2025-11-14 17:44:59,208 - INFO - Processing document 4_2025-09-26


Converted 'data\edgar_documents\TMUS\4_2025-09-24' --> 'data\processed_data\TMUS\4_2025-09-24.md'


2025-11-14 17:44:59,375 - INFO - Finished converting document 4_2025-09-26 in 0.22 sec.
2025-11-14 17:44:59,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\4_2025-09-26' --> 'data\processed_data\TMUS\4_2025-09-26.md'


2025-11-14 17:45:00,119 - INFO - Going to convert document batch...
2025-11-14 17:45:00,122 - INFO - Processing document 4_2025-09-30
2025-11-14 17:45:00,273 - INFO - Finished converting document 4_2025-09-30 in 0.78 sec.
2025-11-14 17:45:00,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:00,454 - INFO - Going to convert document batch...
2025-11-14 17:45:00,457 - INFO - Processing document 4_2025-10-02


Converted 'data\edgar_documents\TMUS\4_2025-09-30' --> 'data\processed_data\TMUS\4_2025-09-30.md'


2025-11-14 17:45:00,647 - INFO - Finished converting document 4_2025-10-02 in 0.28 sec.
2025-11-14 17:45:00,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:00,846 - INFO - Going to convert document batch...
2025-11-14 17:45:00,848 - INFO - Processing document 4_2025-10-06


Converted 'data\edgar_documents\TMUS\4_2025-10-02' --> 'data\processed_data\TMUS\4_2025-10-02.md'


2025-11-14 17:45:00,966 - INFO - Finished converting document 4_2025-10-06 in 0.22 sec.
2025-11-14 17:45:01,084 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:45:01,085 - ERROR - Input document 4_2025-10-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:45:01,088 - INFO - Going to convert document batch...
2025-11-14 17:45:01,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:01,223 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\TMUS\4_2025-10-06' --> 'data\processed_data\TMUS\4_2025-10-06.md'
Error processing data\edgar_documents\TMUS\4_2025-10-08: File format not allowed: data\edgar_documents\TMUS\4_2025-10-08


2025-11-14 17:45:01,356 - INFO - Finished converting document 4_2025-10-10 in 0.26 sec.
2025-11-14 17:45:01,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:01,502 - INFO - Going to convert document batch...
2025-11-14 17:45:01,503 - INFO - Processing document 4_2025-10-14


Converted 'data\edgar_documents\TMUS\4_2025-10-10' --> 'data\processed_data\TMUS\4_2025-10-10.md'


2025-11-14 17:45:01,640 - INFO - Finished converting document 4_2025-10-14 in 0.22 sec.
2025-11-14 17:45:01,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:01,791 - INFO - Going to convert document batch...
2025-11-14 17:45:01,793 - INFO - Processing document 4_2025-10-17
2025-11-14 17:45:01,893 - INFO - Finished converting document 4_2025-10-17 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-10-14' --> 'data\processed_data\TMUS\4_2025-10-14.md'


2025-11-14 17:45:01,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:02,029 - INFO - Going to convert document batch...
2025-11-14 17:45:02,030 - INFO - Processing document 4_2025-10-21
2025-11-14 17:45:02,132 - INFO - Finished converting document 4_2025-10-21 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-10-17' --> 'data\processed_data\TMUS\4_2025-10-17.md'


2025-11-14 17:45:02,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:02,274 - INFO - Going to convert document batch...
2025-11-14 17:45:02,275 - INFO - Processing document 4_2025-10-23
2025-11-14 17:45:02,404 - INFO - Finished converting document 4_2025-10-23 in 0.19 sec.


Converted 'data\edgar_documents\TMUS\4_2025-10-21' --> 'data\processed_data\TMUS\4_2025-10-21.md'


2025-11-14 17:45:02,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:02,602 - INFO - Going to convert document batch...
2025-11-14 17:45:02,603 - INFO - Processing document 4_2025-10-27


Converted 'data\edgar_documents\TMUS\4_2025-10-23' --> 'data\processed_data\TMUS\4_2025-10-23.md'


2025-11-14 17:45:02,722 - INFO - Finished converting document 4_2025-10-27 in 0.19 sec.
2025-11-14 17:45:02,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:02,855 - INFO - Going to convert document batch...
2025-11-14 17:45:02,857 - INFO - Processing document 4_2025-10-29
2025-11-14 17:45:02,963 - INFO - Finished converting document 4_2025-10-29 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\4_2025-10-27' --> 'data\processed_data\TMUS\4_2025-10-27.md'


2025-11-14 17:45:03,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,105 - INFO - Going to convert document batch...
2025-11-14 17:45:03,106 - INFO - Processing document 4_2025-10-31
2025-11-14 17:45:03,178 - INFO - Finished converting document 4_2025-10-31 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\4_2025-10-29' --> 'data\processed_data\TMUS\4_2025-10-29.md'
Converted 'data\edgar_documents\TMUS\4_2025-10-31' --> 'data\processed_data\TMUS\4_2025-10-31.md'


2025-11-14 17:45:03,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,268 - INFO - Going to convert document batch...
2025-11-14 17:45:03,270 - INFO - Processing document 4_2025-11-04
2025-11-14 17:45:03,306 - INFO - Finished converting document 4_2025-11-04 in 0.06 sec.
2025-11-14 17:45:03,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,385 - INFO - Going to convert document batch...
2025-11-14 17:45:03,386 - INFO - Processing document 4_2025-11-10
2025-11-14 17:45:03,431 - INFO - Finished converting document 4_2025-11-10 in 0.08 sec.
2025-11-14 17:45:03,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,511 - INFO - Going to convert document batch...
2025-11-14 17:45:03,513 - INFO - Processing document 8-K_2023-01-04


Converted 'data\edgar_documents\TMUS\4_2025-11-04' --> 'data\processed_data\TMUS\4_2025-11-04.md'
Converted 'data\edgar_documents\TMUS\4_2025-11-10' --> 'data\processed_data\TMUS\4_2025-11-10.md'


2025-11-14 17:45:03,541 - INFO - Finished converting document 8-K_2023-01-04 in 0.08 sec.
2025-11-14 17:45:03,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,610 - INFO - Going to convert document batch...
2025-11-14 17:45:03,611 - INFO - Processing document 8-K_2023-01-19
2025-11-14 17:45:03,635 - INFO - Finished converting document 8-K_2023-01-19 in 0.09 sec.
2025-11-14 17:45:03,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,699 - INFO - Going to convert document batch...
2025-11-14 17:45:03,700 - INFO - Processing document 8-K_2023-02-01


Converted 'data\edgar_documents\TMUS\8-K_2023-01-04' --> 'data\processed_data\TMUS\8-K_2023-01-04.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-01-19' --> 'data\processed_data\TMUS\8-K_2023-01-19.md'


2025-11-14 17:45:03,741 - INFO - Finished converting document 8-K_2023-02-01 in 0.08 sec.
2025-11-14 17:45:03,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,803 - INFO - Going to convert document batch...
2025-11-14 17:45:03,805 - INFO - Processing document 8-K_2023-02-03
2025-11-14 17:45:03,831 - INFO - Finished converting document 8-K_2023-02-03 in 0.06 sec.
2025-11-14 17:45:03,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:03,939 - INFO - Going to convert document batch...
2025-11-14 17:45:03,940 - INFO - Processing document 8-K_2023-02-09


Converted 'data\edgar_documents\TMUS\8-K_2023-02-01' --> 'data\processed_data\TMUS\8-K_2023-02-01.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-02-03' --> 'data\processed_data\TMUS\8-K_2023-02-03.md'


2025-11-14 17:45:03,999 - INFO - Finished converting document 8-K_2023-02-09 in 0.14 sec.
2025-11-14 17:45:04,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,086 - INFO - Going to convert document batch...
2025-11-14 17:45:04,087 - INFO - Processing document 8-K_2023-02-13
2025-11-14 17:45:04,116 - INFO - Finished converting document 8-K_2023-02-13 in 0.08 sec.
2025-11-14 17:45:04,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,211 - INFO - Going to convert document batch...
2025-11-14 17:45:04,213 - INFO - Processing document 8-K_2023-03-10


Converted 'data\edgar_documents\TMUS\8-K_2023-02-09' --> 'data\processed_data\TMUS\8-K_2023-02-09.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-02-13' --> 'data\processed_data\TMUS\8-K_2023-02-13.md'


2025-11-14 17:45:04,270 - INFO - Finished converting document 8-K_2023-03-10 in 0.12 sec.
2025-11-14 17:45:04,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,376 - INFO - Going to convert document batch...
2025-11-14 17:45:04,378 - INFO - Processing document 8-K_2023-03-20
2025-11-14 17:45:04,448 - INFO - Finished converting document 8-K_2023-03-20 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\8-K_2023-03-10' --> 'data\processed_data\TMUS\8-K_2023-03-10.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-03-20' --> 'data\processed_data\TMUS\8-K_2023-03-20.md'


2025-11-14 17:45:04,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,555 - INFO - Going to convert document batch...
2025-11-14 17:45:04,556 - INFO - Processing document 8-K_2023-04-27
2025-11-14 17:45:04,589 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 17:45:04,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,646 - INFO - Going to convert document batch...
2025-11-14 17:45:04,648 - INFO - Processing document 8-K_2023-05-01
2025-11-14 17:45:04,696 - INFO - Finished converting document 8-K_2023-05-01 in 0.08 sec.
2025-11-14 17:45:04,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,773 - INFO - Going to convert document batch...
2025-11-14 17:45:04,774 - INFO - Processing document 8-K_2023-05-11


Converted 'data\edgar_documents\TMUS\8-K_2023-04-27' --> 'data\processed_data\TMUS\8-K_2023-04-27.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-05-01' --> 'data\processed_data\TMUS\8-K_2023-05-01.md'


2025-11-14 17:45:04,819 - INFO - Finished converting document 8-K_2023-05-11 in 0.09 sec.
2025-11-14 17:45:04,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:04,924 - INFO - Going to convert document batch...
2025-11-14 17:45:04,925 - INFO - Processing document 8-K_2023-06-21
2025-11-14 17:45:05,021 - INFO - Finished converting document 8-K_2023-06-21 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\8-K_2023-05-11' --> 'data\processed_data\TMUS\8-K_2023-05-11.md'


2025-11-14 17:45:05,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,120 - INFO - Going to convert document batch...
2025-11-14 17:45:05,121 - INFO - Processing document 8-K_2023-07-11
2025-11-14 17:45:05,181 - INFO - Finished converting document 8-K_2023-07-11 in 0.09 sec.
2025-11-14 17:45:05,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,266 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\8-K_2023-06-21' --> 'data\processed_data\TMUS\8-K_2023-06-21.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-07-11' --> 'data\processed_data\TMUS\8-K_2023-07-11.md'


2025-11-14 17:45:05,269 - INFO - Processing document 8-K_2023-07-20
2025-11-14 17:45:05,323 - INFO - Finished converting document 8-K_2023-07-20 in 0.12 sec.
2025-11-14 17:45:05,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,382 - INFO - Going to convert document batch...
2025-11-14 17:45:05,384 - INFO - Processing document 8-K_2023-07-27
2025-11-14 17:45:05,415 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.
2025-11-14 17:45:05,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,473 - INFO - Going to convert document batch...
2025-11-14 17:45:05,474 - INFO - Processing document 8-K_2023-08-24
2025-11-14 17:45:05,502 - INFO - Finished converting document 8-K_2023-08-24 in 0.06 sec.


Converted 'data\edgar_documents\TMUS\8-K_2023-07-20' --> 'data\processed_data\TMUS\8-K_2023-07-20.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-07-27' --> 'data\processed_data\TMUS\8-K_2023-07-27.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-08-24' --> 'data\processed_data\TMUS\8-K_2023-08-24.md'


2025-11-14 17:45:05,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,563 - INFO - Going to convert document batch...
2025-11-14 17:45:05,564 - INFO - Processing document 8-K_2023-09-06
2025-11-14 17:45:05,592 - INFO - Finished converting document 8-K_2023-09-06 in 0.08 sec.
2025-11-14 17:45:05,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,664 - INFO - Going to convert document batch...
2025-11-14 17:45:05,664 - INFO - Processing document 8-K_2023-09-08
2025-11-14 17:45:05,702 - INFO - Finished converting document 8-K_2023-09-08 in 0.08 sec.
2025-11-14 17:45:05,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,776 - INFO - Going to convert document batch...
2025-11-14 17:45:05,778 - INFO - Processing document 8-K_2023-09-12


Converted 'data\edgar_documents\TMUS\8-K_2023-09-06' --> 'data\processed_data\TMUS\8-K_2023-09-06.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-09-08' --> 'data\processed_data\TMUS\8-K_2023-09-08.md'


2025-11-14 17:45:05,836 - INFO - Finished converting document 8-K_2023-09-12 in 0.11 sec.
2025-11-14 17:45:05,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:05,941 - INFO - Going to convert document batch...
2025-11-14 17:45:05,942 - INFO - Processing document 8-K_2023-09-14
2025-11-14 17:45:05,997 - INFO - Finished converting document 8-K_2023-09-14 in 0.14 sec.


Converted 'data\edgar_documents\TMUS\8-K_2023-09-12' --> 'data\processed_data\TMUS\8-K_2023-09-12.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-09-14' --> 'data\processed_data\TMUS\8-K_2023-09-14.md'


2025-11-14 17:45:06,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:06,080 - INFO - Going to convert document batch...
2025-11-14 17:45:06,082 - INFO - Processing document 8-K_2023-09-25
2025-11-14 17:45:06,119 - INFO - Finished converting document 8-K_2023-09-25 in 0.11 sec.
2025-11-14 17:45:06,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:06,178 - INFO - Going to convert document batch...
2025-11-14 17:45:06,180 - INFO - Processing document 8-K_2023-10-25
2025-11-14 17:45:06,211 - INFO - Finished converting document 8-K_2023-10-25 in 0.06 sec.
2025-11-14 17:45:06,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:06,297 - INFO - Going to convert document batch...
2025-11-14 17:45:06,299 - INFO - Processing document 8-K_2023-12-26


Converted 'data\edgar_documents\TMUS\8-K_2023-09-25' --> 'data\processed_data\TMUS\8-K_2023-09-25.md'
Converted 'data\edgar_documents\TMUS\8-K_2023-10-25' --> 'data\processed_data\TMUS\8-K_2023-10-25.md'


2025-11-14 17:45:06,352 - INFO - Finished converting document 8-K_2023-12-26 in 0.11 sec.
2025-11-14 17:45:06,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:06,468 - INFO - Going to convert document batch...
2025-11-14 17:45:06,469 - INFO - Processing document 8-K_2024-01-12
2025-11-14 17:45:06,551 - INFO - Finished converting document 8-K_2024-01-12 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\8-K_2023-12-26' --> 'data\processed_data\TMUS\8-K_2023-12-26.md'


2025-11-14 17:45:06,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\8-K_2024-01-12' --> 'data\processed_data\TMUS\8-K_2024-01-12.md'


2025-11-14 17:45:07,172 - INFO - Going to convert document batch...
2025-11-14 17:45:07,174 - INFO - Processing document 8-K_2024-01-25
2025-11-14 17:45:07,250 - INFO - Finished converting document 8-K_2024-01-25 in 0.66 sec.
2025-11-14 17:45:07,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:07,334 - INFO - Going to convert document batch...
2025-11-14 17:45:07,337 - INFO - Processing document 8-K_2024-04-25
2025-11-14 17:45:07,380 - INFO - Finished converting document 8-K_2024-04-25 in 0.09 sec.
2025-11-14 17:45:07,429 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:45:07,430 - ERROR - Input document 8-K_2024-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.C

Converted 'data\edgar_documents\TMUS\8-K_2024-01-25' --> 'data\processed_data\TMUS\8-K_2024-01-25.md'
Converted 'data\edgar_documents\TMUS\8-K_2024-04-25' --> 'data\processed_data\TMUS\8-K_2024-04-25.md'
Error processing data\edgar_documents\TMUS\8-K_2024-05-08: File format not allowed: data\edgar_documents\TMUS\8-K_2024-05-08


2025-11-14 17:45:07,519 - INFO - Going to convert document batch...
2025-11-14 17:45:07,521 - INFO - Processing document 8-K_2024-06-14
2025-11-14 17:45:07,621 - INFO - Finished converting document 8-K_2024-06-14 in 0.19 sec.
2025-11-14 17:45:07,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:07,714 - INFO - Going to convert document batch...
2025-11-14 17:45:07,715 - INFO - Processing document 8-K_2024-07-24
2025-11-14 17:45:07,768 - INFO - Finished converting document 8-K_2024-07-24 in 0.11 sec.
2025-11-14 17:45:07,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\8-K_2024-06-14' --> 'data\processed_data\TMUS\8-K_2024-06-14.md'
Converted 'data\edgar_documents\TMUS\8-K_2024-07-24' --> 'data\processed_data\TMUS\8-K_2024-07-24.md'


2025-11-14 17:45:07,862 - INFO - Going to convert document batch...
2025-11-14 17:45:07,865 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:45:07,925 - INFO - Finished converting document 8-K_2024-07-31 in 0.12 sec.
2025-11-14 17:45:08,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,097 - INFO - Going to convert document batch...
2025-11-14 17:45:08,101 - INFO - Processing document 8-K_2024-09-13


Converted 'data\edgar_documents\TMUS\8-K_2024-07-31' --> 'data\processed_data\TMUS\8-K_2024-07-31.md'


2025-11-14 17:45:08,198 - INFO - Finished converting document 8-K_2024-09-13 in 0.23 sec.
2025-11-14 17:45:08,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,256 - INFO - Going to convert document batch...
2025-11-14 17:45:08,257 - INFO - Processing document 8-K_2024-09-18
2025-11-14 17:45:08,292 - INFO - Finished converting document 8-K_2024-09-18 in 0.08 sec.
2025-11-14 17:45:08,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,360 - INFO - Going to convert document batch...
2025-11-14 17:45:08,361 - INFO - Processing document 8-K_2024-09-26
2025-11-14 17:45:08,411 - INFO - Finished converting document 8-K_2024-09-26 in 0.09 sec.


Converted 'data\edgar_documents\TMUS\8-K_2024-09-13' --> 'data\processed_data\TMUS\8-K_2024-09-13.md'
Converted 'data\edgar_documents\TMUS\8-K_2024-09-18' --> 'data\processed_data\TMUS\8-K_2024-09-18.md'


2025-11-14 17:45:08,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,481 - INFO - Going to convert document batch...
2025-11-14 17:45:08,482 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:45:08,517 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.
2025-11-14 17:45:08,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,580 - INFO - Going to convert document batch...
2025-11-14 17:45:08,581 - INFO - Processing document 8-K_2024-12-10
2025-11-14 17:45:08,621 - INFO - Finished converting document 8-K_2024-12-10 in 0.09 sec.


Converted 'data\edgar_documents\TMUS\8-K_2024-09-26' --> 'data\processed_data\TMUS\8-K_2024-09-26.md'
Converted 'data\edgar_documents\TMUS\8-K_2024-10-23' --> 'data\processed_data\TMUS\8-K_2024-10-23.md'


2025-11-14 17:45:08,669 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:45:08,670 - ERROR - Input document 8-K_2024-12-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:45:08,671 - INFO - Going to convert document batch...
2025-11-14 17:45:08,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,735 - INFO - Going to convert document batch...
2025-11-14 17:45:08,736 - INFO - Processing document 8-K_2025-01

Converted 'data\edgar_documents\TMUS\8-K_2024-12-10' --> 'data\processed_data\TMUS\8-K_2024-12-10.md'
Error processing data\edgar_documents\TMUS\8-K_2024-12-13: File format not allowed: data\edgar_documents\TMUS\8-K_2024-12-13


2025-11-14 17:45:08,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,861 - INFO - Going to convert document batch...
2025-11-14 17:45:08,862 - INFO - Processing document 8-K_2025-01-29
2025-11-14 17:45:08,897 - INFO - Finished converting document 8-K_2025-01-29 in 0.06 sec.
2025-11-14 17:45:08,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:08,964 - INFO - Going to convert document batch...
2025-11-14 17:45:08,965 - INFO - Processing document 8-K_2025-02-11


Converted 'data\edgar_documents\TMUS\8-K_2025-01-27' --> 'data\processed_data\TMUS\8-K_2025-01-27.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-01-29' --> 'data\processed_data\TMUS\8-K_2025-01-29.md'


2025-11-14 17:45:09,014 - INFO - Finished converting document 8-K_2025-02-11 in 0.09 sec.
2025-11-14 17:45:09,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,092 - INFO - Going to convert document batch...
2025-11-14 17:45:09,093 - INFO - Processing document 8-K_2025-02-21
2025-11-14 17:45:09,146 - INFO - Finished converting document 8-K_2025-02-21 in 0.09 sec.
2025-11-14 17:45:09,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,234 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\8-K_2025-02-11' --> 'data\processed_data\TMUS\8-K_2025-02-11.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-02-21' --> 'data\processed_data\TMUS\8-K_2025-02-21.md'


2025-11-14 17:45:09,235 - INFO - Processing document 8-K_2025-03-21
2025-11-14 17:45:09,280 - INFO - Finished converting document 8-K_2025-03-21 in 0.11 sec.
2025-11-14 17:45:09,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,365 - INFO - Going to convert document batch...
2025-11-14 17:45:09,367 - INFO - Processing document 8-K_2025-03-27
2025-11-14 17:45:09,420 - INFO - Finished converting document 8-K_2025-03-27 in 0.11 sec.
2025-11-14 17:45:09,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,503 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TMUS\8-K_2025-03-21' --> 'data\processed_data\TMUS\8-K_2025-03-21.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-03-27' --> 'data\processed_data\TMUS\8-K_2025-03-27.md'


2025-11-14 17:45:09,505 - INFO - Processing document 8-K_2025-04-03
2025-11-14 17:45:09,541 - INFO - Finished converting document 8-K_2025-04-03 in 0.09 sec.
2025-11-14 17:45:09,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,601 - INFO - Going to convert document batch...
2025-11-14 17:45:09,602 - INFO - Processing document 8-K_2025-04-11
2025-11-14 17:45:09,638 - INFO - Finished converting document 8-K_2025-04-11 in 0.08 sec.
2025-11-14 17:45:09,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,732 - INFO - Going to convert document batch...
2025-11-14 17:45:09,733 - INFO - Processing document 8-K_2025-04-24


Converted 'data\edgar_documents\TMUS\8-K_2025-04-03' --> 'data\processed_data\TMUS\8-K_2025-04-03.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-04-11' --> 'data\processed_data\TMUS\8-K_2025-04-11.md'


2025-11-14 17:45:09,804 - INFO - Finished converting document 8-K_2025-04-24 in 0.14 sec.
2025-11-14 17:45:09,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:09,918 - INFO - Going to convert document batch...
2025-11-14 17:45:09,919 - INFO - Processing document 8-K_2025-06-10
2025-11-14 17:45:09,978 - INFO - Finished converting document 8-K_2025-06-10 in 0.12 sec.
2025-11-14 17:45:10,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\8-K_2025-04-24' --> 'data\processed_data\TMUS\8-K_2025-04-24.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-06-10' --> 'data\processed_data\TMUS\8-K_2025-06-10.md'


2025-11-14 17:45:10,055 - INFO - Going to convert document batch...
2025-11-14 17:45:10,056 - INFO - Processing document 8-K_2025-06-16
2025-11-14 17:45:10,178 - INFO - Finished converting document 8-K_2025-06-16 in 0.17 sec.
2025-11-14 17:45:10,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:10,264 - INFO - Going to convert document batch...
2025-11-14 17:45:10,266 - INFO - Processing document 8-K_2025-07-02
2025-11-14 17:45:10,306 - INFO - Finished converting document 8-K_2025-07-02 in 0.08 sec.
2025-11-14 17:45:10,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:10,364 - INFO - Going to convert document batch...
2025-11-14 17:45:10,364 - INFO - Processing document 8-K_2025-07-23


Converted 'data\edgar_documents\TMUS\8-K_2025-06-16' --> 'data\processed_data\TMUS\8-K_2025-06-16.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-07-02' --> 'data\processed_data\TMUS\8-K_2025-07-02.md'


2025-11-14 17:45:10,402 - INFO - Finished converting document 8-K_2025-07-23 in 0.08 sec.
2025-11-14 17:45:10,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:10,522 - INFO - Going to convert document batch...
2025-11-14 17:45:10,523 - INFO - Processing document 8-K_2025-08-05
2025-11-14 17:45:10,576 - INFO - Finished converting document 8-K_2025-08-05 in 0.16 sec.


Converted 'data\edgar_documents\TMUS\8-K_2025-07-23' --> 'data\processed_data\TMUS\8-K_2025-07-23.md'


2025-11-14 17:45:10,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:10,688 - INFO - Going to convert document batch...
2025-11-14 17:45:10,689 - INFO - Processing document 8-K_2025-08-25
2025-11-14 17:45:10,727 - INFO - Finished converting document 8-K_2025-08-25 in 0.09 sec.
2025-11-14 17:45:10,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TMUS\8-K_2025-08-05' --> 'data\processed_data\TMUS\8-K_2025-08-05.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-08-25' --> 'data\processed_data\TMUS\8-K_2025-08-25.md'


2025-11-14 17:45:10,839 - INFO - Going to convert document batch...
2025-11-14 17:45:10,841 - INFO - Processing document 8-K_2025-09-04
2025-11-14 17:45:10,882 - INFO - Finished converting document 8-K_2025-09-04 in 0.11 sec.
2025-11-14 17:45:10,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:10,976 - INFO - Going to convert document batch...
2025-11-14 17:45:10,977 - INFO - Processing document 8-K_2025-09-22
2025-11-14 17:45:11,084 - INFO - Finished converting document 8-K_2025-09-22 in 0.17 sec.


Converted 'data\edgar_documents\TMUS\8-K_2025-09-04' --> 'data\processed_data\TMUS\8-K_2025-09-04.md'


2025-11-14 17:45:11,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:11,189 - INFO - Going to convert document batch...
2025-11-14 17:45:11,190 - INFO - Processing document 8-K_2025-09-24
2025-11-14 17:45:11,227 - INFO - Finished converting document 8-K_2025-09-24 in 0.08 sec.
2025-11-14 17:45:11,277 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:45:11,278 - ERROR - Input document 8-K_2025-10-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\TMUS\8-K_2025-09-22' --> 'data\processed_data\TMUS\8-K_2025-09-22.md'
Converted 'data\edgar_documents\TMUS\8-K_2025-09-24' --> 'data\processed_data\TMUS\8-K_2025-09-24.md'
Error processing data\edgar_documents\TMUS\8-K_2025-10-09: File format not allowed: data\edgar_documents\TMUS\8-K_2025-10-09


2025-11-14 17:45:11,327 - INFO - Processing document 8-K_2025-10-23
2025-11-14 17:45:11,365 - INFO - Finished converting document 8-K_2025-10-23 in 0.08 sec.
2025-11-14 17:45:11,439 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:45:11,440 - ERROR - Input document DEF-14A_2023-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:45:11,444 - INFO - Going to convert document batch...
2025-11-14 17:45:11,505 - INFO - detected formats:

Converted 'data\edgar_documents\TMUS\8-K_2025-10-23' --> 'data\processed_data\TMUS\8-K_2025-10-23.md'
Error processing data\edgar_documents\TMUS\DEF-14A_2023-04-28: File format not allowed: data\edgar_documents\TMUS\DEF-14A_2023-04-28
Error processing data\edgar_documents\TMUS\DEF-14A_2024-04-26: File format not allowed: data\edgar_documents\TMUS\DEF-14A_2024-04-26
Error processing data\edgar_documents\TMUS\DEF-14A_2025-04-18: File format not allowed: data\edgar_documents\TMUS\DEF-14A_2025-04-18
Processed 234 new files. Errors: 20
Found 133 files to process in data\edgar_documents\TSLA


2025-11-14 17:45:11,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:45:15,536 - INFO - Going to convert document batch...
2025-11-14 17:45:15,537 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:45:15,540 - INFO - Processing document 10-K_2023-01-31
2025-11-14 17:45:22,410 - INFO - Finished converting document 10-K_2023-01-31 in 10.83 sec.
2025-11-14 17:45:23,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-K_2023-01-31' --> 'data\processed_data\TSLA\10-K_2023-01-31.md'


2025-11-14 17:45:26,016 - INFO - Going to convert document batch...
2025-11-14 17:45:26,017 - INFO - Processing document 10-K_2024-01-29
2025-11-14 17:45:29,715 - INFO - Finished converting document 10-K_2024-01-29 in 6.08 sec.
2025-11-14 17:45:31,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-K_2024-01-29' --> 'data\processed_data\TSLA\10-K_2024-01-29.md'


2025-11-14 17:45:32,994 - INFO - Going to convert document batch...
2025-11-14 17:45:32,995 - INFO - Processing document 10-K_2025-01-30
2025-11-14 17:45:37,694 - INFO - Finished converting document 10-K_2025-01-30 in 6.27 sec.
2025-11-14 17:45:39,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-K_2025-01-30' --> 'data\processed_data\TSLA\10-K_2025-01-30.md'


2025-11-14 17:45:40,000 - INFO - Going to convert document batch...
2025-11-14 17:45:40,001 - INFO - Processing document 10-K_2025-04-30
2025-11-14 17:45:50,606 - INFO - Finished converting document 10-K_2025-04-30 in 11.33 sec.
2025-11-14 17:45:51,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-K_2025-04-30' --> 'data\processed_data\TSLA\10-K_2025-04-30.md'


2025-11-14 17:45:54,182 - INFO - Going to convert document batch...
2025-11-14 17:45:54,183 - INFO - Processing document 10-Q_2023-04-24
2025-11-14 17:45:56,108 - INFO - Finished converting document 10-Q_2023-04-24 in 4.39 sec.
2025-11-14 17:45:56,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2023-04-24' --> 'data\processed_data\TSLA\10-Q_2023-04-24.md'


2025-11-14 17:45:59,711 - INFO - Going to convert document batch...
2025-11-14 17:45:59,713 - INFO - Processing document 10-Q_2023-07-24
2025-11-14 17:46:02,515 - INFO - Finished converting document 10-Q_2023-07-24 in 5.91 sec.
2025-11-14 17:46:03,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2023-07-24' --> 'data\processed_data\TSLA\10-Q_2023-07-24.md'


2025-11-14 17:46:04,108 - INFO - Going to convert document batch...
2025-11-14 17:46:04,110 - INFO - Processing document 10-Q_2023-10-23
2025-11-14 17:46:05,796 - INFO - Finished converting document 10-Q_2023-10-23 in 2.72 sec.
2025-11-14 17:46:06,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2023-10-23' --> 'data\processed_data\TSLA\10-Q_2023-10-23.md'


2025-11-14 17:46:07,388 - INFO - Going to convert document batch...
2025-11-14 17:46:07,390 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 17:46:09,922 - INFO - Finished converting document 10-Q_2024-04-24 in 3.33 sec.
2025-11-14 17:46:10,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2024-04-24' --> 'data\processed_data\TSLA\10-Q_2024-04-24.md'


2025-11-14 17:46:11,649 - INFO - Going to convert document batch...
2025-11-14 17:46:11,651 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 17:46:13,355 - INFO - Finished converting document 10-Q_2024-07-24 in 2.69 sec.
2025-11-14 17:46:14,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2024-07-24' --> 'data\processed_data\TSLA\10-Q_2024-07-24.md'


2025-11-14 17:46:15,333 - INFO - Going to convert document batch...
2025-11-14 17:46:15,336 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 17:46:17,564 - INFO - Finished converting document 10-Q_2024-10-24 in 3.41 sec.
2025-11-14 17:46:18,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2024-10-24' --> 'data\processed_data\TSLA\10-Q_2024-10-24.md'


2025-11-14 17:46:18,928 - INFO - Going to convert document batch...
2025-11-14 17:46:18,929 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 17:46:20,127 - INFO - Finished converting document 10-Q_2025-04-23 in 1.94 sec.
2025-11-14 17:46:20,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2025-04-23' --> 'data\processed_data\TSLA\10-Q_2025-04-23.md'


2025-11-14 17:46:21,588 - INFO - Going to convert document batch...
2025-11-14 17:46:21,589 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 17:46:24,028 - INFO - Finished converting document 10-Q_2025-07-24 in 3.27 sec.
2025-11-14 17:46:24,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\10-Q_2025-07-24' --> 'data\processed_data\TSLA\10-Q_2025-07-24.md'


2025-11-14 17:46:25,893 - INFO - Going to convert document batch...
2025-11-14 17:46:25,894 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 17:46:27,498 - INFO - Finished converting document 10-Q_2025-10-23 in 2.62 sec.
2025-11-14 17:46:28,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:28,308 - INFO - Going to convert document batch...
2025-11-14 17:46:28,310 - INFO - Processing document 4_2023-01-03
2025-11-14 17:46:28,376 - INFO - Finished converting document 4_2023-01-03 in 0.11 sec.


Converted 'data\edgar_documents\TSLA\10-Q_2025-10-23' --> 'data\processed_data\TSLA\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\TSLA\4_2023-01-03' --> 'data\processed_data\TSLA\4_2023-01-03.md'


2025-11-14 17:46:28,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:28,511 - INFO - Going to convert document batch...
2025-11-14 17:46:28,514 - INFO - Processing document 4_2023-01-06
2025-11-14 17:46:28,575 - INFO - Finished converting document 4_2023-01-06 in 0.12 sec.
2025-11-14 17:46:28,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:28,654 - INFO - Going to convert document batch...
2025-11-14 17:46:28,656 - INFO - Processing document 4_2023-01-31
2025-11-14 17:46:28,701 - INFO - Finished converting document 4_2023-01-31 in 0.09 sec.
2025-11-14 17:46:28,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-01-06' --> 'data\processed_data\TSLA\4_2023-01-06.md'
Converted 'data\edgar_documents\TSLA\4_2023-01-31' --> 'data\processed_data\TSLA\4_2023-01-31.md'


2025-11-14 17:46:28,793 - INFO - Going to convert document batch...
2025-11-14 17:46:28,795 - INFO - Processing document 4_2023-02-08
2025-11-14 17:46:28,857 - INFO - Finished converting document 4_2023-02-08 in 0.12 sec.
2025-11-14 17:46:28,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:28,978 - INFO - Going to convert document batch...
2025-11-14 17:46:28,981 - INFO - Processing document 4_2023-03-01
2025-11-14 17:46:29,025 - INFO - Finished converting document 4_2023-03-01 in 0.09 sec.
2025-11-14 17:46:29,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-02-08' --> 'data\processed_data\TSLA\4_2023-02-08.md'
Converted 'data\edgar_documents\TSLA\4_2023-03-01' --> 'data\processed_data\TSLA\4_2023-03-01.md'


2025-11-14 17:46:29,104 - INFO - Going to convert document batch...
2025-11-14 17:46:29,105 - INFO - Processing document 4_2023-03-07
2025-11-14 17:46:29,149 - INFO - Finished converting document 4_2023-03-07 in 0.08 sec.
2025-11-14 17:46:29,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:29,266 - INFO - Going to convert document batch...
2025-11-14 17:46:29,267 - INFO - Processing document 4_2023-03-10
2025-11-14 17:46:29,333 - INFO - Finished converting document 4_2023-03-10 in 0.12 sec.
2025-11-14 17:46:29,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-03-07' --> 'data\processed_data\TSLA\4_2023-03-07.md'
Converted 'data\edgar_documents\TSLA\4_2023-03-10' --> 'data\processed_data\TSLA\4_2023-03-10.md'


2025-11-14 17:46:29,406 - INFO - Going to convert document batch...
2025-11-14 17:46:29,406 - INFO - Processing document 4_2023-03-29
2025-11-14 17:46:29,453 - INFO - Finished converting document 4_2023-03-29 in 0.08 sec.
2025-11-14 17:46:29,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:29,558 - INFO - Going to convert document batch...
2025-11-14 17:46:29,559 - INFO - Processing document 4_2023-04-05
2025-11-14 17:46:29,653 - INFO - Finished converting document 4_2023-04-05 in 0.16 sec.


Converted 'data\edgar_documents\TSLA\4_2023-03-29' --> 'data\processed_data\TSLA\4_2023-03-29.md'


2025-11-14 17:46:29,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:29,779 - INFO - Going to convert document batch...
2025-11-14 17:46:29,781 - INFO - Processing document 4_2023-04-06
2025-11-14 17:46:29,836 - INFO - Finished converting document 4_2023-04-06 in 0.11 sec.
2025-11-14 17:46:29,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:29,912 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2023-04-05' --> 'data\processed_data\TSLA\4_2023-04-05.md'
Converted 'data\edgar_documents\TSLA\4_2023-04-06' --> 'data\processed_data\TSLA\4_2023-04-06.md'


2025-11-14 17:46:29,913 - INFO - Processing document 4_2023-05-01
2025-11-14 17:46:29,954 - INFO - Finished converting document 4_2023-05-01 in 0.08 sec.
2025-11-14 17:46:30,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:30,059 - INFO - Going to convert document batch...
2025-11-14 17:46:30,061 - INFO - Processing document 4_2023-05-08
2025-11-14 17:46:30,104 - INFO - Finished converting document 4_2023-05-08 in 0.09 sec.
2025-11-14 17:46:30,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:30,209 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2023-05-01' --> 'data\processed_data\TSLA\4_2023-05-01.md'
Converted 'data\edgar_documents\TSLA\4_2023-05-08' --> 'data\processed_data\TSLA\4_2023-05-08.md'


2025-11-14 17:46:30,211 - INFO - Processing document 4_2023-05-23
2025-11-14 17:46:30,270 - INFO - Finished converting document 4_2023-05-23 in 0.11 sec.
2025-11-14 17:46:30,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:30,360 - INFO - Going to convert document batch...
2025-11-14 17:46:30,361 - INFO - Processing document 4_2023-06-01
2025-11-14 17:46:30,426 - INFO - Finished converting document 4_2023-06-01 in 0.11 sec.
2025-11-14 17:46:30,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-05-23' --> 'data\processed_data\TSLA\4_2023-05-23.md'
Converted 'data\edgar_documents\TSLA\4_2023-06-01' --> 'data\processed_data\TSLA\4_2023-06-01.md'


2025-11-14 17:46:30,540 - INFO - Going to convert document batch...
2025-11-14 17:46:30,541 - INFO - Processing document 4_2023-06-07
2025-11-14 17:46:30,628 - INFO - Finished converting document 4_2023-06-07 in 0.14 sec.
2025-11-14 17:46:30,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:30,723 - INFO - Going to convert document batch...
2025-11-14 17:46:30,724 - INFO - Processing document 4_2023-06-13
2025-11-14 17:46:30,775 - INFO - Finished converting document 4_2023-06-13 in 0.08 sec.
2025-11-14 17:46:30,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:30,867 - INFO - Going to convert document batch...
2025-11-14 17:46:30,867 - INFO - Processing document 4_2023-06-16
2025-11-14 17:46:30,904 - INFO - Finished converting document 4_2023-06-16 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\4_2023-06-07' --> 'data\processed_data\TSLA\4_2023-06-07.md'
Converted 'data\edgar_documents\TSLA\4_2023-06-13' --> 'data\processed_data\TSLA\4_2023-06-13.md'


2025-11-14 17:46:30,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,016 - INFO - Going to convert document batch...
2025-11-14 17:46:31,020 - INFO - Processing document 4_2023-06-29
2025-11-14 17:46:31,094 - INFO - Finished converting document 4_2023-06-29 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\4_2023-06-16' --> 'data\processed_data\TSLA\4_2023-06-16.md'
Converted 'data\edgar_documents\TSLA\4_2023-06-29' --> 'data\processed_data\TSLA\4_2023-06-29.md'


2025-11-14 17:46:31,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,175 - INFO - Going to convert document batch...
2025-11-14 17:46:31,176 - INFO - Processing document 4_2023-07-06
2025-11-14 17:46:31,229 - INFO - Finished converting document 4_2023-07-06 in 0.09 sec.
2025-11-14 17:46:31,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,349 - INFO - Going to convert document batch...
2025-11-14 17:46:31,350 - INFO - Processing document 4_2023-07-07
2025-11-14 17:46:31,406 - INFO - Finished converting document 4_2023-07-07 in 0.11 sec.
2025-11-14 17:46:31,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-07-06' --> 'data\processed_data\TSLA\4_2023-07-06.md'
Converted 'data\edgar_documents\TSLA\4_2023-07-07' --> 'data\processed_data\TSLA\4_2023-07-07.md'


2025-11-14 17:46:31,516 - INFO - Going to convert document batch...
2025-11-14 17:46:31,516 - INFO - Processing document 4_2023-07-11
2025-11-14 17:46:31,559 - INFO - Finished converting document 4_2023-07-11 in 0.09 sec.
2025-11-14 17:46:31,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,639 - INFO - Going to convert document batch...
2025-11-14 17:46:31,640 - INFO - Processing document 4_2023-07-31
2025-11-14 17:46:31,680 - INFO - Finished converting document 4_2023-07-31 in 0.06 sec.
2025-11-14 17:46:31,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,779 - INFO - Going to convert document batch...
2025-11-14 17:46:31,782 - INFO - Processing document 4_2023-08-03


Converted 'data\edgar_documents\TSLA\4_2023-07-11' --> 'data\processed_data\TSLA\4_2023-07-11.md'
Converted 'data\edgar_documents\TSLA\4_2023-07-31' --> 'data\processed_data\TSLA\4_2023-07-31.md'


2025-11-14 17:46:31,847 - INFO - Finished converting document 4_2023-08-03 in 0.11 sec.
2025-11-14 17:46:31,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:31,949 - INFO - Going to convert document batch...
2025-11-14 17:46:31,949 - INFO - Processing document 4_2023-08-08
2025-11-14 17:46:31,989 - INFO - Finished converting document 4_2023-08-08 in 0.08 sec.
2025-11-14 17:46:32,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2023-08-03' --> 'data\processed_data\TSLA\4_2023-08-03.md'
Converted 'data\edgar_documents\TSLA\4_2023-08-08' --> 'data\processed_data\TSLA\4_2023-08-08.md'


2025-11-14 17:46:32,092 - INFO - Going to convert document batch...
2025-11-14 17:46:32,094 - INFO - Processing document 4_2023-08-30
2025-11-14 17:46:32,219 - INFO - Finished converting document 4_2023-08-30 in 0.19 sec.
2025-11-14 17:46:32,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:32,403 - INFO - Going to convert document batch...
2025-11-14 17:46:32,404 - INFO - Processing document 4_2023-09-06
2025-11-14 17:46:32,436 - INFO - Finished converting document 4_2023-09-06 in 0.08 sec.
2025-11-14 17:46:32,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:32,535 - INFO - Going to convert document batch...
2025-11-14 17:46:32,537 - INFO - Processing document 4_2023-09-07


Converted 'data\edgar_documents\TSLA\4_2023-08-30' --> 'data\processed_data\TSLA\4_2023-08-30.md'
Converted 'data\edgar_documents\TSLA\4_2023-09-06' --> 'data\processed_data\TSLA\4_2023-09-06.md'


2025-11-14 17:46:33,531 - INFO - Finished converting document 4_2023-09-07 in 1.06 sec.
2025-11-14 17:46:33,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:33,639 - INFO - Going to convert document batch...
2025-11-14 17:46:33,640 - INFO - Processing document 4_2023-09-29
2025-11-14 17:46:33,694 - INFO - Finished converting document 4_2023-09-29 in 0.11 sec.
2025-11-14 17:46:33,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:33,766 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2023-09-07' --> 'data\processed_data\TSLA\4_2023-09-07.md'
Converted 'data\edgar_documents\TSLA\4_2023-09-29' --> 'data\processed_data\TSLA\4_2023-09-29.md'


2025-11-14 17:46:33,767 - INFO - Processing document 4_2023-10-11
2025-11-14 17:46:33,822 - INFO - Finished converting document 4_2023-10-11 in 0.08 sec.
2025-11-14 17:46:33,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:33,945 - INFO - Going to convert document batch...
2025-11-14 17:46:33,947 - INFO - Processing document 4_2023-10-31
2025-11-14 17:46:34,014 - INFO - Finished converting document 4_2023-10-31 in 0.12 sec.
2025-11-14 17:46:34,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,087 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2023-10-11' --> 'data\processed_data\TSLA\4_2023-10-11.md'
Converted 'data\edgar_documents\TSLA\4_2023-10-31' --> 'data\processed_data\TSLA\4_2023-10-31.md'


2025-11-14 17:46:34,088 - INFO - Processing document 4_2023-12-01
2025-11-14 17:46:34,130 - INFO - Finished converting document 4_2023-12-01 in 0.08 sec.
2025-11-14 17:46:34,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,205 - INFO - Going to convert document batch...
2025-11-14 17:46:34,206 - INFO - Processing document 4_2023-12-07
2025-11-14 17:46:34,246 - INFO - Finished converting document 4_2023-12-07 in 0.08 sec.
2025-11-14 17:46:34,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,331 - INFO - Going to convert document batch...
2025-11-14 17:46:34,333 - INFO - Processing document 4_2023-12-18
2025-11-14 17:46:34,377 - INFO - Finished converting document 4_2023-12-18 in 0.09 sec.


Converted 'data\edgar_documents\TSLA\4_2023-12-01' --> 'data\processed_data\TSLA\4_2023-12-01.md'
Converted 'data\edgar_documents\TSLA\4_2023-12-07' --> 'data\processed_data\TSLA\4_2023-12-07.md'


2025-11-14 17:46:34,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,453 - INFO - Going to convert document batch...
2025-11-14 17:46:34,454 - INFO - Processing document 4_2024-02-02
2025-11-14 17:46:34,498 - INFO - Finished converting document 4_2024-02-02 in 0.08 sec.
2025-11-14 17:46:34,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,579 - INFO - Going to convert document batch...
2025-11-14 17:46:34,579 - INFO - Processing document 4_2024-02-23
2025-11-14 17:46:34,641 - INFO - Finished converting document 4_2024-02-23 in 0.11 sec.


Converted 'data\edgar_documents\TSLA\4_2023-12-18' --> 'data\processed_data\TSLA\4_2023-12-18.md'
Converted 'data\edgar_documents\TSLA\4_2024-02-02' --> 'data\processed_data\TSLA\4_2024-02-02.md'


2025-11-14 17:46:34,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,722 - INFO - Going to convert document batch...
2025-11-14 17:46:34,723 - INFO - Processing document 4_2024-03-04
2025-11-14 17:46:34,762 - INFO - Finished converting document 4_2024-03-04 in 0.08 sec.
2025-11-14 17:46:34,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,830 - INFO - Going to convert document batch...
2025-11-14 17:46:34,831 - INFO - Processing document 4_2024-03-07
2025-11-14 17:46:34,884 - INFO - Finished converting document 4_2024-03-07 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\4_2024-02-23' --> 'data\processed_data\TSLA\4_2024-02-23.md'
Converted 'data\edgar_documents\TSLA\4_2024-03-04' --> 'data\processed_data\TSLA\4_2024-03-04.md'


2025-11-14 17:46:34,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:34,995 - INFO - Going to convert document batch...
2025-11-14 17:46:34,997 - INFO - Processing document 4_2024-03-14
2025-11-14 17:46:35,085 - INFO - Finished converting document 4_2024-03-14 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\4_2024-03-07' --> 'data\processed_data\TSLA\4_2024-03-07.md'


2025-11-14 17:46:35,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,195 - INFO - Going to convert document batch...
2025-11-14 17:46:35,196 - INFO - Processing document 4_2024-04-03
2025-11-14 17:46:35,236 - INFO - Finished converting document 4_2024-04-03 in 0.08 sec.
2025-11-14 17:46:35,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,332 - INFO - Going to convert document batch...
2025-11-14 17:46:35,333 - INFO - Processing document 4_2024-05-07


Converted 'data\edgar_documents\TSLA\4_2024-03-14' --> 'data\processed_data\TSLA\4_2024-03-14.md'
Converted 'data\edgar_documents\TSLA\4_2024-04-03' --> 'data\processed_data\TSLA\4_2024-04-03.md'


2025-11-14 17:46:35,400 - INFO - Finished converting document 4_2024-05-07 in 0.11 sec.
2025-11-14 17:46:35,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,493 - INFO - Going to convert document batch...
2025-11-14 17:46:35,496 - INFO - Processing document 4_2024-06-05
2025-11-14 17:46:35,539 - INFO - Finished converting document 4_2024-06-05 in 0.08 sec.
2025-11-14 17:46:35,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,618 - INFO - Going to convert document batch...
2025-11-14 17:46:35,619 - INFO - Processing document 4_2024-06-07


Converted 'data\edgar_documents\TSLA\4_2024-05-07' --> 'data\processed_data\TSLA\4_2024-05-07.md'
Converted 'data\edgar_documents\TSLA\4_2024-06-05' --> 'data\processed_data\TSLA\4_2024-06-05.md'


2025-11-14 17:46:35,667 - INFO - Finished converting document 4_2024-06-07 in 0.08 sec.
2025-11-14 17:46:35,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,765 - INFO - Going to convert document batch...
2025-11-14 17:46:35,766 - INFO - Processing document 4_2024-07-29
2025-11-14 17:46:35,838 - INFO - Finished converting document 4_2024-07-29 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\4_2024-06-07' --> 'data\processed_data\TSLA\4_2024-06-07.md'


2025-11-14 17:46:35,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:35,934 - INFO - Going to convert document batch...
2025-11-14 17:46:35,936 - INFO - Processing document 4_2024-09-09
2025-11-14 17:46:35,982 - INFO - Finished converting document 4_2024-09-09 in 0.09 sec.
2025-11-14 17:46:36,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2024-07-29' --> 'data\processed_data\TSLA\4_2024-07-29.md'
Converted 'data\edgar_documents\TSLA\4_2024-09-09' --> 'data\processed_data\TSLA\4_2024-09-09.md'


2025-11-14 17:46:36,077 - INFO - Going to convert document batch...
2025-11-14 17:46:36,080 - INFO - Processing document 4_2024-09-25
2025-11-14 17:46:36,128 - INFO - Finished converting document 4_2024-09-25 in 0.09 sec.
2025-11-14 17:46:36,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:36,200 - INFO - Going to convert document batch...
2025-11-14 17:46:36,200 - INFO - Processing document 4_2024-10-28
2025-11-14 17:46:36,241 - INFO - Finished converting document 4_2024-10-28 in 0.08 sec.
2025-11-14 17:46:36,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:36,352 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2024-09-25' --> 'data\processed_data\TSLA\4_2024-09-25.md'
Converted 'data\edgar_documents\TSLA\4_2024-10-28' --> 'data\processed_data\TSLA\4_2024-10-28.md'


2025-11-14 17:46:36,354 - INFO - Processing document 4_2024-11-04
2025-11-14 17:46:36,399 - INFO - Finished converting document 4_2024-11-04 in 0.09 sec.
2025-11-14 17:46:36,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:36,490 - INFO - Going to convert document batch...
2025-11-14 17:46:36,491 - INFO - Processing document 4_2024-11-05
2025-11-14 17:46:36,549 - INFO - Finished converting document 4_2024-11-05 in 0.09 sec.


Converted 'data\edgar_documents\TSLA\4_2024-11-04' --> 'data\processed_data\TSLA\4_2024-11-04.md'
Converted 'data\edgar_documents\TSLA\4_2024-11-05' --> 'data\processed_data\TSLA\4_2024-11-05.md'


2025-11-14 17:46:36,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:36,688 - INFO - Going to convert document batch...
2025-11-14 17:46:36,692 - INFO - Processing document 4_2024-11-13
2025-11-14 17:46:36,798 - INFO - Finished converting document 4_2024-11-13 in 0.19 sec.
2025-11-14 17:46:36,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:36,956 - INFO - Going to convert document batch...
2025-11-14 17:46:36,958 - INFO - Processing document 4_2024-11-19
2025-11-14 17:46:37,069 - INFO - Finished converting document 4_2024-11-19 in 0.19 sec.


Converted 'data\edgar_documents\TSLA\4_2024-11-13' --> 'data\processed_data\TSLA\4_2024-11-13.md'


2025-11-14 17:46:37,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:37,222 - INFO - Going to convert document batch...
2025-11-14 17:46:37,223 - INFO - Processing document 4_2024-12-04
2025-11-14 17:46:37,290 - INFO - Finished converting document 4_2024-12-04 in 0.12 sec.
2025-11-14 17:46:37,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2024-11-19' --> 'data\processed_data\TSLA\4_2024-11-19.md'
Converted 'data\edgar_documents\TSLA\4_2024-12-04' --> 'data\processed_data\TSLA\4_2024-12-04.md'


2025-11-14 17:46:37,387 - INFO - Going to convert document batch...
2025-11-14 17:46:37,389 - INFO - Processing document 4_2024-12-06
2025-11-14 17:46:37,478 - INFO - Finished converting document 4_2024-12-06 in 0.12 sec.
2025-11-14 17:46:37,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:37,570 - INFO - Going to convert document batch...
2025-11-14 17:46:37,572 - INFO - Processing document 4_2024-12-09
2025-11-14 17:46:37,613 - INFO - Finished converting document 4_2024-12-09 in 0.08 sec.
2025-11-14 17:46:37,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:37,697 - INFO - Going to convert document batch...
2025-11-14 17:46:37,699 - INFO - Processing document 4_2024-12-13


Converted 'data\edgar_documents\TSLA\4_2024-12-06' --> 'data\processed_data\TSLA\4_2024-12-06.md'
Converted 'data\edgar_documents\TSLA\4_2024-12-09' --> 'data\processed_data\TSLA\4_2024-12-09.md'


2025-11-14 17:46:37,736 - INFO - Finished converting document 4_2024-12-13 in 0.08 sec.
2025-11-14 17:46:37,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:37,805 - INFO - Going to convert document batch...
2025-11-14 17:46:37,806 - INFO - Processing document 4_2024-12-31
2025-11-14 17:46:37,842 - INFO - Finished converting document 4_2024-12-31 in 0.08 sec.
2025-11-14 17:46:37,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:37,951 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2024-12-13' --> 'data\processed_data\TSLA\4_2024-12-13.md'
Converted 'data\edgar_documents\TSLA\4_2024-12-31' --> 'data\processed_data\TSLA\4_2024-12-31.md'


2025-11-14 17:46:37,953 - INFO - Processing document 4_2025-01-08
2025-11-14 17:46:38,072 - INFO - Finished converting document 4_2025-01-08 in 0.19 sec.
2025-11-14 17:46:38,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:38,298 - INFO - Going to convert document batch...
2025-11-14 17:46:38,303 - INFO - Processing document 4_2025-02-05


Converted 'data\edgar_documents\TSLA\4_2025-01-08' --> 'data\processed_data\TSLA\4_2025-01-08.md'


2025-11-14 17:46:38,440 - INFO - Finished converting document 4_2025-02-05 in 0.22 sec.
2025-11-14 17:46:38,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:38,603 - INFO - Going to convert document batch...
2025-11-14 17:46:38,605 - INFO - Processing document 4_2025-02-10
2025-11-14 17:46:38,643 - INFO - Finished converting document 4_2025-02-10 in 0.08 sec.
2025-11-14 17:46:38,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:38,738 - INFO - Going to convert document batch...
2025-11-14 17:46:38,741 - INFO - Processing document 4_2025-03-05


Converted 'data\edgar_documents\TSLA\4_2025-02-05' --> 'data\processed_data\TSLA\4_2025-02-05.md'
Converted 'data\edgar_documents\TSLA\4_2025-02-10' --> 'data\processed_data\TSLA\4_2025-02-10.md'


2025-11-14 17:46:38,922 - INFO - Finished converting document 4_2025-03-05 in 0.23 sec.
2025-11-14 17:46:39,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:39,083 - INFO - Going to convert document batch...
2025-11-14 17:46:39,085 - INFO - Processing document 4_2025-03-06
2025-11-14 17:46:39,168 - INFO - Finished converting document 4_2025-03-06 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\4_2025-03-05' --> 'data\processed_data\TSLA\4_2025-03-05.md'
Converted 'data\edgar_documents\TSLA\4_2025-03-06' --> 'data\processed_data\TSLA\4_2025-03-06.md'


2025-11-14 17:46:39,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:39,268 - INFO - Going to convert document batch...
2025-11-14 17:46:39,270 - INFO - Processing document 4_2025-03-12
2025-11-14 17:46:39,318 - INFO - Finished converting document 4_2025-03-12 in 0.08 sec.
2025-11-14 17:46:39,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:39,411 - INFO - Going to convert document batch...
2025-11-14 17:46:39,412 - INFO - Processing document 4_2025-04-09
2025-11-14 17:46:39,461 - INFO - Finished converting document 4_2025-04-09 in 0.09 sec.
2025-11-14 17:46:39,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:39,541 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2025-03-12' --> 'data\processed_data\TSLA\4_2025-03-12.md'
Converted 'data\edgar_documents\TSLA\4_2025-04-09' --> 'data\processed_data\TSLA\4_2025-04-09.md'


2025-11-14 17:46:39,542 - INFO - Processing document 4_2025-04-28
2025-11-14 17:46:39,584 - INFO - Finished converting document 4_2025-04-28 in 0.08 sec.
2025-11-14 17:46:39,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:39,676 - INFO - Going to convert document batch...
2025-11-14 17:46:39,677 - INFO - Processing document 4_2025-05-01
2025-11-14 17:46:39,718 - INFO - Finished converting document 4_2025-05-01 in 0.08 sec.
2025-11-14 17:46:39,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2025-04-28' --> 'data\processed_data\TSLA\4_2025-04-28.md'
Converted 'data\edgar_documents\TSLA\4_2025-05-01' --> 'data\processed_data\TSLA\4_2025-05-01.md'


2025-11-14 17:46:39,861 - INFO - Going to convert document batch...
2025-11-14 17:46:39,864 - INFO - Processing document 4_2025-05-05
2025-11-14 17:46:39,987 - INFO - Finished converting document 4_2025-05-05 in 0.22 sec.
2025-11-14 17:46:40,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2025-05-05' --> 'data\processed_data\TSLA\4_2025-05-05.md'


2025-11-14 17:46:40,821 - INFO - Going to convert document batch...
2025-11-14 17:46:40,824 - INFO - Processing document 4_2025-05-08
2025-11-14 17:46:40,911 - INFO - Finished converting document 4_2025-05-08 in 0.84 sec.
2025-11-14 17:46:40,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:41,006 - INFO - Going to convert document batch...
2025-11-14 17:46:41,007 - INFO - Processing document 4_2025-05-13
2025-11-14 17:46:41,080 - INFO - Finished converting document 4_2025-05-13 in 0.12 sec.
2025-11-14 17:46:41,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\4_2025-05-08' --> 'data\processed_data\TSLA\4_2025-05-08.md'
Converted 'data\edgar_documents\TSLA\4_2025-05-13' --> 'data\processed_data\TSLA\4_2025-05-13.md'


2025-11-14 17:46:41,153 - INFO - Going to convert document batch...
2025-11-14 17:46:41,154 - INFO - Processing document 4_2025-05-20
2025-11-14 17:46:41,184 - INFO - Finished converting document 4_2025-05-20 in 0.08 sec.
2025-11-14 17:46:41,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:41,293 - INFO - Going to convert document batch...
2025-11-14 17:46:41,294 - INFO - Processing document 4_2025-05-29
2025-11-14 17:46:41,394 - INFO - Finished converting document 4_2025-05-29 in 0.16 sec.


Converted 'data\edgar_documents\TSLA\4_2025-05-20' --> 'data\processed_data\TSLA\4_2025-05-20.md'


2025-11-14 17:46:41,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:41,529 - INFO - Going to convert document batch...
2025-11-14 17:46:41,530 - INFO - Processing document 4_2025-06-04
2025-11-14 17:46:41,647 - INFO - Finished converting document 4_2025-06-04 in 0.17 sec.


Converted 'data\edgar_documents\TSLA\4_2025-05-29' --> 'data\processed_data\TSLA\4_2025-05-29.md'


2025-11-14 17:46:41,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:41,769 - INFO - Going to convert document batch...
2025-11-14 17:46:41,770 - INFO - Processing document 4_2025-06-09
2025-11-14 17:46:41,813 - INFO - Finished converting document 4_2025-06-09 in 0.08 sec.
2025-11-14 17:46:41,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:41,888 - INFO - Going to convert document batch...
2025-11-14 17:46:41,889 - INFO - Processing document 4_2025-06-16
2025-11-14 17:46:41,929 - INFO - Finished converting document 4_2025-06-16 in 0.06 sec.


Converted 'data\edgar_documents\TSLA\4_2025-06-04' --> 'data\processed_data\TSLA\4_2025-06-04.md'
Converted 'data\edgar_documents\TSLA\4_2025-06-09' --> 'data\processed_data\TSLA\4_2025-06-09.md'


2025-11-14 17:46:41,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,013 - INFO - Going to convert document batch...
2025-11-14 17:46:42,014 - INFO - Processing document 4_2025-07-09
2025-11-14 17:46:42,110 - INFO - Finished converting document 4_2025-07-09 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\4_2025-06-16' --> 'data\processed_data\TSLA\4_2025-06-16.md'


2025-11-14 17:46:42,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,213 - INFO - Going to convert document batch...
2025-11-14 17:46:42,213 - INFO - Processing document 4_2025-07-15
2025-11-14 17:46:42,253 - INFO - Finished converting document 4_2025-07-15 in 0.08 sec.
2025-11-14 17:46:42,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,324 - INFO - Going to convert document batch...
2025-11-14 17:46:42,327 - INFO - Processing document 4_2025-08-04


Converted 'data\edgar_documents\TSLA\4_2025-07-09' --> 'data\processed_data\TSLA\4_2025-07-09.md'
Converted 'data\edgar_documents\TSLA\4_2025-07-15' --> 'data\processed_data\TSLA\4_2025-07-15.md'


2025-11-14 17:46:42,367 - INFO - Finished converting document 4_2025-08-04 in 0.06 sec.
2025-11-14 17:46:42,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,438 - INFO - Going to convert document batch...
2025-11-14 17:46:42,439 - INFO - Processing document 4_2025-08-28
2025-11-14 17:46:42,472 - INFO - Finished converting document 4_2025-08-28 in 0.06 sec.
2025-11-14 17:46:42,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,542 - INFO - Going to convert document batch...
2025-11-14 17:46:42,543 - INFO - Processing document 4_2025-09-09
2025-11-14 17:46:42,584 - INFO - Finished converting document 4_2025-09-09 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\4_2025-08-04' --> 'data\processed_data\TSLA\4_2025-08-04.md'
Converted 'data\edgar_documents\TSLA\4_2025-08-28' --> 'data\processed_data\TSLA\4_2025-08-28.md'


2025-11-14 17:46:42,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,661 - INFO - Going to convert document batch...
2025-11-14 17:46:42,664 - INFO - Processing document 4_2025-09-12
2025-11-14 17:46:42,717 - INFO - Finished converting document 4_2025-09-12 in 0.09 sec.
2025-11-14 17:46:42,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:42,826 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TSLA\4_2025-09-09' --> 'data\processed_data\TSLA\4_2025-09-09.md'
Converted 'data\edgar_documents\TSLA\4_2025-09-12' --> 'data\processed_data\TSLA\4_2025-09-12.md'


2025-11-14 17:46:42,827 - INFO - Processing document 4_2025-09-15
2025-11-14 17:46:42,945 - INFO - Finished converting document 4_2025-09-15 in 0.19 sec.
2025-11-14 17:46:43,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,108 - INFO - Going to convert document batch...
2025-11-14 17:46:43,109 - INFO - Processing document 4_2025-09-17
2025-11-14 17:46:43,141 - INFO - Finished converting document 4_2025-09-17 in 0.06 sec.
2025-11-14 17:46:43,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,208 - INFO - Going to convert document batch...
2025-11-14 17:46:43,210 - INFO - Processing document 4_2025-11-10


Converted 'data\edgar_documents\TSLA\4_2025-09-15' --> 'data\processed_data\TSLA\4_2025-09-15.md'
Converted 'data\edgar_documents\TSLA\4_2025-09-17' --> 'data\processed_data\TSLA\4_2025-09-17.md'


2025-11-14 17:46:43,280 - INFO - Finished converting document 4_2025-11-10 in 0.11 sec.
2025-11-14 17:46:43,372 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:46:43,374 - ERROR - Input document 8-K_2023-01-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:46:43,374 - INFO - Going to convert document batch...
2025-11-14 17:46:43,409 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>

Converted 'data\edgar_documents\TSLA\4_2025-11-10' --> 'data\processed_data\TSLA\4_2025-11-10.md'
Error processing data\edgar_documents\TSLA\8-K_2023-01-03: File format not allowed: data\edgar_documents\TSLA\8-K_2023-01-03
Error processing data\edgar_documents\TSLA\8-K_2023-01-25: File format not allowed: data\edgar_documents\TSLA\8-K_2023-01-25
Error processing data\edgar_documents\TSLA\8-K_2023-04-03: File format not allowed: data\edgar_documents\TSLA\8-K_2023-04-03
Error processing data\edgar_documents\TSLA\8-K_2023-04-05: File format not allowed: data\edgar_documents\TSLA\8-K_2023-04-05
Error processing data\edgar_documents\TSLA\8-K_2023-04-19: File format not allowed: data\edgar_documents\TSLA\8-K_2023-04-19
Error processing data\edgar_documents\TSLA\8-K_2023-05-22: File format not allowed: data\edgar_documents\TSLA\8-K_2023-05-22


2025-11-14 17:46:43,543 - INFO - Going to convert document batch...
2025-11-14 17:46:43,544 - INFO - Processing document 8-K_2023-07-03
2025-11-14 17:46:43,572 - INFO - Finished converting document 8-K_2023-07-03 in 0.06 sec.
2025-11-14 17:46:43,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,634 - INFO - Going to convert document batch...
2025-11-14 17:46:43,635 - INFO - Processing document 8-K_2023-07-19
2025-11-14 17:46:43,673 - INFO - Finished converting document 8-K_2023-07-19 in 0.09 sec.
2025-11-14 17:46:43,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,756 - INFO - Going to convert document batch...
2025-11-14 17:46:43,757 - INFO - Processing document 8-K_2023-07-20


Converted 'data\edgar_documents\TSLA\8-K_2023-07-03' --> 'data\processed_data\TSLA\8-K_2023-07-03.md'
Converted 'data\edgar_documents\TSLA\8-K_2023-07-19' --> 'data\processed_data\TSLA\8-K_2023-07-19.md'


2025-11-14 17:46:43,794 - INFO - Finished converting document 8-K_2023-07-20 in 0.11 sec.
2025-11-14 17:46:43,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,867 - INFO - Going to convert document batch...
2025-11-14 17:46:43,868 - INFO - Processing document 8-K_2023-08-07
2025-11-14 17:46:43,895 - INFO - Finished converting document 8-K_2023-08-07 in 0.08 sec.
2025-11-14 17:46:43,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:43,959 - INFO - Going to convert document batch...
2025-11-14 17:46:43,960 - INFO - Processing document 8-K_2023-10-02
2025-11-14 17:46:43,994 - INFO - Finished converting document 8-K_2023-10-02 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\8-K_2023-07-20' --> 'data\processed_data\TSLA\8-K_2023-07-20.md'
Converted 'data\edgar_documents\TSLA\8-K_2023-08-07' --> 'data\processed_data\TSLA\8-K_2023-08-07.md'


2025-11-14 17:46:44,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,051 - INFO - Going to convert document batch...
2025-11-14 17:46:44,053 - INFO - Processing document 8-K_2023-10-10
2025-11-14 17:46:44,095 - INFO - Finished converting document 8-K_2023-10-10 in 0.08 sec.
2025-11-14 17:46:44,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,161 - INFO - Going to convert document batch...
2025-11-14 17:46:44,163 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:46:44,195 - INFO - Finished converting document 8-K_2023-10-18 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\8-K_2023-10-02' --> 'data\processed_data\TSLA\8-K_2023-10-02.md'
Converted 'data\edgar_documents\TSLA\8-K_2023-10-10' --> 'data\processed_data\TSLA\8-K_2023-10-10.md'


2025-11-14 17:46:44,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,250 - INFO - Going to convert document batch...
2025-11-14 17:46:44,251 - INFO - Processing document 8-K_2024-01-02
2025-11-14 17:46:44,278 - INFO - Finished converting document 8-K_2024-01-02 in 0.06 sec.
2025-11-14 17:46:44,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,351 - INFO - Going to convert document batch...
2025-11-14 17:46:44,353 - INFO - Processing document 8-K_2024-01-24
2025-11-14 17:46:44,387 - INFO - Finished converting document 8-K_2024-01-24 in 0.09 sec.


Converted 'data\edgar_documents\TSLA\8-K_2023-10-18' --> 'data\processed_data\TSLA\8-K_2023-10-18.md'
Converted 'data\edgar_documents\TSLA\8-K_2024-01-02' --> 'data\processed_data\TSLA\8-K_2024-01-02.md'


2025-11-14 17:46:44,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,454 - INFO - Going to convert document batch...
2025-11-14 17:46:44,456 - INFO - Processing document 8-K_2024-04-02
2025-11-14 17:46:44,487 - INFO - Finished converting document 8-K_2024-04-02 in 0.08 sec.
2025-11-14 17:46:44,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,547 - INFO - Going to convert document batch...
2025-11-14 17:46:44,548 - INFO - Processing document 8-K_2024-04-16
2025-11-14 17:46:44,574 - INFO - Finished converting document 8-K_2024-04-16 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\8-K_2024-01-24' --> 'data\processed_data\TSLA\8-K_2024-01-24.md'
Converted 'data\edgar_documents\TSLA\8-K_2024-04-02' --> 'data\processed_data\TSLA\8-K_2024-04-02.md'
Converted 'data\edgar_documents\TSLA\8-K_2024-04-16' --> 'data\processed_data\TSLA\8-K_2024-04-16.md'


2025-11-14 17:46:44,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,644 - INFO - Going to convert document batch...
2025-11-14 17:46:44,646 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:46:44,679 - INFO - Finished converting document 8-K_2024-04-23 in 0.09 sec.
2025-11-14 17:46:44,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:44,873 - INFO - Going to convert document batch...
2025-11-14 17:46:44,874 - INFO - Processing document 8-K_2024-06-14


Converted 'data\edgar_documents\TSLA\8-K_2024-04-23' --> 'data\processed_data\TSLA\8-K_2024-04-23.md'


2025-11-14 17:46:44,955 - INFO - Finished converting document 8-K_2024-06-14 in 0.23 sec.
2025-11-14 17:46:45,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,051 - INFO - Going to convert document batch...
2025-11-14 17:46:45,051 - INFO - Processing document 8-K_2024-07-02
2025-11-14 17:46:45,095 - INFO - Finished converting document 8-K_2024-07-02 in 0.09 sec.
2025-11-14 17:46:45,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\8-K_2024-06-14' --> 'data\processed_data\TSLA\8-K_2024-06-14.md'
Converted 'data\edgar_documents\TSLA\8-K_2024-07-02' --> 'data\processed_data\TSLA\8-K_2024-07-02.md'


2025-11-14 17:46:45,196 - INFO - Going to convert document batch...
2025-11-14 17:46:45,199 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:46:45,254 - INFO - Finished converting document 8-K_2024-07-23 in 0.12 sec.
2025-11-14 17:46:45,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,315 - INFO - Going to convert document batch...
2025-11-14 17:46:45,317 - INFO - Processing document 8-K_2024-10-02
2025-11-14 17:46:45,363 - INFO - Finished converting document 8-K_2024-10-02 in 0.08 sec.
2025-11-14 17:46:45,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,423 - INFO - Going to convert document batch...
2025-11-14 17:46:45,423 - INFO - Processing document 8-K_2024-10-23
2025-11-14 17:46:45,449 - INFO - Finished converting document 8-K_2024-10-23 in 0.08 sec.


Converted 'data\edgar_documents\TSLA\8-K_2024-07-23' --> 'data\processed_data\TSLA\8-K_2024-07-23.md'
Converted 'data\edgar_documents\TSLA\8-K_2024-10-02' --> 'data\processed_data\TSLA\8-K_2024-10-02.md'


2025-11-14 17:46:45,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,541 - INFO - Going to convert document batch...
2025-11-14 17:46:45,543 - INFO - Processing document 8-K_2025-01-02
2025-11-14 17:46:45,589 - INFO - Finished converting document 8-K_2025-01-02 in 0.11 sec.
2025-11-14 17:46:45,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\8-K_2024-10-23' --> 'data\processed_data\TSLA\8-K_2024-10-23.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-01-02' --> 'data\processed_data\TSLA\8-K_2025-01-02.md'


2025-11-14 17:46:45,710 - INFO - Going to convert document batch...
2025-11-14 17:46:45,711 - INFO - Processing document 8-K_2025-01-29
2025-11-14 17:46:45,759 - INFO - Finished converting document 8-K_2025-01-29 in 0.14 sec.
2025-11-14 17:46:45,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,808 - INFO - Going to convert document batch...
2025-11-14 17:46:45,809 - INFO - Processing document 8-K_2025-04-02
2025-11-14 17:46:45,845 - INFO - Finished converting document 8-K_2025-04-02 in 0.06 sec.
2025-11-14 17:46:45,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:45,896 - INFO - Going to convert document batch...
2025-11-14 17:46:45,897 - INFO - Processing document 8-K_2025-04-22
2025-11-14 17:46:45,927 - INFO - Finished converting document 8-K_2025-04-22 in 0.06 sec.
2025-11-14 17:46:45,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\8-K_2025-01-29' --> 'data\processed_data\TSLA\8-K_2025-01-29.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-04-02' --> 'data\processed_data\TSLA\8-K_2025-04-02.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-04-22' --> 'data\processed_data\TSLA\8-K_2025-04-22.md'


2025-11-14 17:46:45,993 - INFO - Going to convert document batch...
2025-11-14 17:46:45,996 - INFO - Processing document 8-K_2025-05-16
2025-11-14 17:46:46,048 - INFO - Finished converting document 8-K_2025-05-16 in 0.11 sec.
2025-11-14 17:46:46,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,135 - INFO - Going to convert document batch...
2025-11-14 17:46:46,137 - INFO - Processing document 8-K_2025-07-02
2025-11-14 17:46:46,188 - INFO - Finished converting document 8-K_2025-07-02 in 0.09 sec.
2025-11-14 17:46:46,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,237 - INFO - Going to convert document batch...
2025-11-14 17:46:46,238 - INFO - Processing document 8-K_2025-07-10
2025-11-14 17:46:46,265 - INFO - Finished converting document 8-K_2025-07-10 in 0.06 sec.


Converted 'data\edgar_documents\TSLA\8-K_2025-05-16' --> 'data\processed_data\TSLA\8-K_2025-05-16.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-07-02' --> 'data\processed_data\TSLA\8-K_2025-07-02.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-07-10' --> 'data\processed_data\TSLA\8-K_2025-07-10.md'


2025-11-14 17:46:46,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,331 - INFO - Going to convert document batch...
2025-11-14 17:46:46,334 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:46:46,392 - INFO - Finished converting document 8-K_2025-07-23 in 0.11 sec.
2025-11-14 17:46:46,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,474 - INFO - Going to convert document batch...
2025-11-14 17:46:46,475 - INFO - Processing document 8-K_2025-08-04
2025-11-14 17:46:46,553 - INFO - Finished converting document 8-K_2025-08-04 in 0.14 sec.


Converted 'data\edgar_documents\TSLA\8-K_2025-07-23' --> 'data\processed_data\TSLA\8-K_2025-07-23.md'


2025-11-14 17:46:46,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,699 - INFO - Going to convert document batch...
2025-11-14 17:46:46,702 - INFO - Processing document 8-K_2025-09-05
2025-11-14 17:46:46,755 - INFO - Finished converting document 8-K_2025-09-05 in 0.11 sec.
2025-11-14 17:46:46,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,807 - INFO - Going to convert document batch...
2025-11-14 17:46:46,813 - INFO - Processing document 8-K_2025-10-02


Converted 'data\edgar_documents\TSLA\8-K_2025-08-04' --> 'data\processed_data\TSLA\8-K_2025-08-04.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-09-05' --> 'data\processed_data\TSLA\8-K_2025-09-05.md'


2025-11-14 17:46:46,864 - INFO - Finished converting document 8-K_2025-10-02 in 0.08 sec.
2025-11-14 17:46:46,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:46,916 - INFO - Going to convert document batch...
2025-11-14 17:46:46,917 - INFO - Processing document 8-K_2025-10-22
2025-11-14 17:46:46,971 - INFO - Finished converting document 8-K_2025-10-22 in 0.09 sec.
2025-11-14 17:46:47,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TSLA\8-K_2025-10-02' --> 'data\processed_data\TSLA\8-K_2025-10-02.md'
Converted 'data\edgar_documents\TSLA\8-K_2025-10-22' --> 'data\processed_data\TSLA\8-K_2025-10-22.md'


2025-11-14 17:46:47,123 - INFO - Going to convert document batch...
2025-11-14 17:46:47,127 - INFO - Processing document 8-K_2025-11-07
2025-11-14 17:46:47,340 - INFO - Finished converting document 8-K_2025-11-07 in 0.36 sec.
2025-11-14 17:46:47,426 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:46:47,427 - ERROR - Input document DEF-14A_2023-04-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:46:47,431 - INFO - Going to convert 

Converted 'data\edgar_documents\TSLA\8-K_2025-11-07' --> 'data\processed_data\TSLA\8-K_2025-11-07.md'
Error processing data\edgar_documents\TSLA\DEF-14A_2023-04-06: File format not allowed: data\edgar_documents\TSLA\DEF-14A_2023-04-06


2025-11-14 17:46:47,675 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:46:47,676 - ERROR - Input document DEF-14A_2025-09-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:46:47,683 - INFO - Going to convert document batch...


Error processing data\edgar_documents\TSLA\DEF-14A_2024-04-29: File format not allowed: data\edgar_documents\TSLA\DEF-14A_2024-04-29
Error processing data\edgar_documents\TSLA\DEF-14A_2025-09-17: File format not allowed: data\edgar_documents\TSLA\DEF-14A_2025-09-17
Processed 124 new files. Errors: 9
Found 102 files to process in data\edgar_documents\TXN


2025-11-14 17:46:47,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:46:49,227 - INFO - Going to convert document batch...
2025-11-14 17:46:49,228 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:46:49,229 - INFO - Processing document 10-K_2023-02-03
2025-11-14 17:46:51,159 - INFO - Finished converting document 10-K_2023-02-03 in 3.45 sec.
2025-11-14 17:46:52,389 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-K_2023-02-03' --> 'data\processed_data\TXN\10-K_2023-02-03.md'


2025-11-14 17:46:53,886 - INFO - Going to convert document batch...
2025-11-14 17:46:53,888 - INFO - Processing document 10-K_2024-02-02
2025-11-14 17:46:56,295 - INFO - Finished converting document 10-K_2024-02-02 in 3.95 sec.
2025-11-14 17:46:57,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-K_2024-02-02' --> 'data\processed_data\TXN\10-K_2024-02-02.md'


2025-11-14 17:46:59,093 - INFO - Going to convert document batch...
2025-11-14 17:46:59,094 - INFO - Processing document 10-K_2025-02-14
2025-11-14 17:47:01,099 - INFO - Finished converting document 10-K_2025-02-14 in 3.67 sec.
2025-11-14 17:47:01,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-K_2025-02-14' --> 'data\processed_data\TXN\10-K_2025-02-14.md'


2025-11-14 17:47:02,360 - INFO - Going to convert document batch...
2025-11-14 17:47:02,361 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 17:47:03,242 - INFO - Finished converting document 10-Q_2023-04-26 in 1.34 sec.
2025-11-14 17:47:03,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2023-04-26' --> 'data\processed_data\TXN\10-Q_2023-04-26.md'


2025-11-14 17:47:04,599 - INFO - Going to convert document batch...
2025-11-14 17:47:04,602 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 17:47:05,750 - INFO - Finished converting document 10-Q_2023-07-26 in 1.88 sec.
2025-11-14 17:47:06,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2023-07-26' --> 'data\processed_data\TXN\10-Q_2023-07-26.md'


2025-11-14 17:47:08,006 - INFO - Going to convert document batch...
2025-11-14 17:47:08,008 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 17:47:09,049 - INFO - Finished converting document 10-Q_2023-10-25 in 2.73 sec.
2025-11-14 17:47:09,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2023-10-25' --> 'data\processed_data\TXN\10-Q_2023-10-25.md'


2025-11-14 17:47:10,215 - INFO - Going to convert document batch...
2025-11-14 17:47:10,217 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 17:47:11,124 - INFO - Finished converting document 10-Q_2024-04-24 in 1.56 sec.
2025-11-14 17:47:11,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2024-04-24' --> 'data\processed_data\TXN\10-Q_2024-04-24.md'


2025-11-14 17:47:12,327 - INFO - Going to convert document batch...
2025-11-14 17:47:12,330 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 17:47:13,530 - INFO - Finished converting document 10-Q_2024-07-24 in 1.86 sec.
2025-11-14 17:47:14,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2024-07-24' --> 'data\processed_data\TXN\10-Q_2024-07-24.md'


2025-11-14 17:47:15,369 - INFO - Going to convert document batch...
2025-11-14 17:47:15,371 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 17:47:16,725 - INFO - Finished converting document 10-Q_2024-10-23 in 2.06 sec.
2025-11-14 17:47:17,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2024-10-23' --> 'data\processed_data\TXN\10-Q_2024-10-23.md'


2025-11-14 17:47:17,873 - INFO - Going to convert document batch...
2025-11-14 17:47:17,875 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:47:18,979 - INFO - Finished converting document 10-Q_2025-04-24 in 1.75 sec.
2025-11-14 17:47:19,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2025-04-24' --> 'data\processed_data\TXN\10-Q_2025-04-24.md'


2025-11-14 17:47:20,836 - INFO - Going to convert document batch...
2025-11-14 17:47:20,837 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 17:47:22,025 - INFO - Finished converting document 10-Q_2025-07-29 in 2.56 sec.
2025-11-14 17:47:22,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\10-Q_2025-07-29' --> 'data\processed_data\TXN\10-Q_2025-07-29.md'


2025-11-14 17:47:23,331 - INFO - Going to convert document batch...
2025-11-14 17:47:23,333 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 17:47:24,369 - INFO - Finished converting document 10-Q_2025-10-23 in 1.86 sec.
2025-11-14 17:47:24,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:24,928 - INFO - Going to convert document batch...
2025-11-14 17:47:24,929 - INFO - Processing document 4_2023-01-30
2025-11-14 17:47:24,970 - INFO - Finished converting document 4_2023-01-30 in 0.08 sec.
2025-11-14 17:47:25,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:25,037 - INFO - Going to convert document batch...
2025-11-14 17:47:25,038 - INFO - Processing document 4_2023-02-02
2025-11-14 17:47:25,073 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.


Converted 'data\edgar_documents\TXN\10-Q_2025-10-23' --> 'data\processed_data\TXN\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\TXN\4_2023-01-30' --> 'data\processed_data\TXN\4_2023-01-30.md'


2025-11-14 17:47:25,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:25,150 - INFO - Going to convert document batch...
2025-11-14 17:47:25,151 - INFO - Processing document 4_2023-02-07
2025-11-14 17:47:25,222 - INFO - Finished converting document 4_2023-02-07 in 0.11 sec.
2025-11-14 17:47:25,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\4_2023-02-02' --> 'data\processed_data\TXN\4_2023-02-02.md'
Converted 'data\edgar_documents\TXN\4_2023-02-07' --> 'data\processed_data\TXN\4_2023-02-07.md'


2025-11-14 17:47:25,312 - INFO - Going to convert document batch...
2025-11-14 17:47:25,313 - INFO - Processing document 4_2023-02-15
2025-11-14 17:47:25,343 - INFO - Finished converting document 4_2023-02-15 in 0.08 sec.
2025-11-14 17:47:25,399 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:47:25,400 - ERROR - Input document 4_2023-03-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:47:25,401 - INFO - Going to convert document batch...
2025-11-14 17:47:25,423 - IN

Converted 'data\edgar_documents\TXN\4_2023-02-15' --> 'data\processed_data\TXN\4_2023-02-15.md'
Error processing data\edgar_documents\TXN\4_2023-03-07: File format not allowed: data\edgar_documents\TXN\4_2023-03-07
Error processing data\edgar_documents\TXN\4_2023-03-08: File format not allowed: data\edgar_documents\TXN\4_2023-03-08
Converted 'data\edgar_documents\TXN\4_2023-03-20' --> 'data\processed_data\TXN\4_2023-03-20.md'


2025-11-14 17:47:25,583 - INFO - Going to convert document batch...
2025-11-14 17:47:25,584 - INFO - Processing document 4_2023-04-05
2025-11-14 17:47:25,618 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 17:47:25,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:25,745 - INFO - Going to convert document batch...
2025-11-14 17:47:25,748 - INFO - Processing document 4_2023-05-01


Converted 'data\edgar_documents\TXN\4_2023-04-05' --> 'data\processed_data\TXN\4_2023-04-05.md'


2025-11-14 17:47:25,909 - INFO - Finished converting document 4_2023-05-01 in 0.25 sec.
2025-11-14 17:47:25,995 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:47:25,996 - ERROR - Input document 4_2023-05-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:47:25,998 - INFO - Going to convert document batch...
2025-11-14 17:47:26,025 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:47:26,026 - ERROR - Input document 4_2023-05-12 with forma

Converted 'data\edgar_documents\TXN\4_2023-05-01' --> 'data\processed_data\TXN\4_2023-05-01.md'
Error processing data\edgar_documents\TXN\4_2023-05-11: File format not allowed: data\edgar_documents\TXN\4_2023-05-11
Error processing data\edgar_documents\TXN\4_2023-05-12: File format not allowed: data\edgar_documents\TXN\4_2023-05-12


2025-11-14 17:47:26,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,199 - INFO - Going to convert document batch...
2025-11-14 17:47:26,200 - INFO - Processing document 4_2023-07-31
2025-11-14 17:47:26,239 - INFO - Finished converting document 4_2023-07-31 in 0.08 sec.
2025-11-14 17:47:26,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,307 - INFO - Going to convert document batch...
2025-11-14 17:47:26,308 - INFO - Processing document 4_2023-08-03
2025-11-14 17:47:26,351 - INFO - Finished converting document 4_2023-08-03 in 0.08 sec.


Converted 'data\edgar_documents\TXN\4_2023-06-20' --> 'data\processed_data\TXN\4_2023-06-20.md'
Converted 'data\edgar_documents\TXN\4_2023-07-31' --> 'data\processed_data\TXN\4_2023-07-31.md'


2025-11-14 17:47:26,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,420 - INFO - Going to convert document batch...
2025-11-14 17:47:26,421 - INFO - Processing document 4_2023-09-25
2025-11-14 17:47:26,458 - INFO - Finished converting document 4_2023-09-25 in 0.06 sec.
2025-11-14 17:47:26,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,519 - INFO - Going to convert document batch...
2025-11-14 17:47:26,520 - INFO - Processing document 4_2023-11-01
2025-11-14 17:47:26,554 - INFO - Finished converting document 4_2023-11-01 in 0.06 sec.


Converted 'data\edgar_documents\TXN\4_2023-08-03' --> 'data\processed_data\TXN\4_2023-08-03.md'
Converted 'data\edgar_documents\TXN\4_2023-09-25' --> 'data\processed_data\TXN\4_2023-09-25.md'
Converted 'data\edgar_documents\TXN\4_2023-11-01' --> 'data\processed_data\TXN\4_2023-11-01.md'


2025-11-14 17:47:26,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,627 - INFO - Going to convert document batch...
2025-11-14 17:47:26,628 - INFO - Processing document 4_2023-11-03
2025-11-14 17:47:26,662 - INFO - Finished converting document 4_2023-11-03 in 0.08 sec.
2025-11-14 17:47:26,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,732 - INFO - Going to convert document batch...
2025-11-14 17:47:26,733 - INFO - Processing document 4_2023-11-15
2025-11-14 17:47:26,773 - INFO - Finished converting document 4_2023-11-15 in 0.06 sec.
2025-11-14 17:47:26,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:26,849 - INFO - Going to convert document batch...
2025-11-14 17:47:26,850 - INFO - Processing document 4_2023-12-22
2025-11-14 17:47:26,911 - INFO - Finished converting document 4_2023-12-22 in 0.09 sec.


Converted 'data\edgar_documents\TXN\4_2023-11-03' --> 'data\processed_data\TXN\4_2023-11-03.md'
Converted 'data\edgar_documents\TXN\4_2023-11-15' --> 'data\processed_data\TXN\4_2023-11-15.md'


2025-11-14 17:47:26,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:27,005 - INFO - Going to convert document batch...
2025-11-14 17:47:27,006 - INFO - Processing document 4_2024-01-29
2025-11-14 17:47:27,100 - INFO - Finished converting document 4_2024-01-29 in 0.14 sec.
2025-11-14 17:47:27,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\4_2023-12-22' --> 'data\processed_data\TXN\4_2023-12-22.md'
Converted 'data\edgar_documents\TXN\4_2024-01-29' --> 'data\processed_data\TXN\4_2024-01-29.md'


2025-11-14 17:47:27,172 - INFO - Going to convert document batch...
2025-11-14 17:47:27,173 - INFO - Processing document 4_2024-02-02
2025-11-14 17:47:27,206 - INFO - Finished converting document 4_2024-02-02 in 0.06 sec.
2025-11-14 17:47:27,297 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:47:27,298 - ERROR - Input document 4_2024-02-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:47:27,299 - INFO - Going to convert document batch...
2025-11-14 17:47:27,323 - IN

Converted 'data\edgar_documents\TXN\4_2024-02-02' --> 'data\processed_data\TXN\4_2024-02-02.md'
Error processing data\edgar_documents\TXN\4_2024-02-05: File format not allowed: data\edgar_documents\TXN\4_2024-02-05
Error processing data\edgar_documents\TXN\4_2024-02-07: File format not allowed: data\edgar_documents\TXN\4_2024-02-07


2025-11-14 17:47:27,976 - INFO - Finished converting document 4_2024-03-05 in 0.64 sec.
2025-11-14 17:47:28,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,069 - INFO - Going to convert document batch...
2025-11-14 17:47:28,070 - INFO - Processing document 4_2024-03-26
2025-11-14 17:47:28,107 - INFO - Finished converting document 4_2024-03-26 in 0.08 sec.
2025-11-14 17:47:28,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,180 - INFO - Going to convert document batch...
2025-11-14 17:47:28,181 - INFO - Processing document 4_2024-05-01


Converted 'data\edgar_documents\TXN\4_2024-03-05' --> 'data\processed_data\TXN\4_2024-03-05.md'
Converted 'data\edgar_documents\TXN\4_2024-03-26' --> 'data\processed_data\TXN\4_2024-03-26.md'


2025-11-14 17:47:28,218 - INFO - Finished converting document 4_2024-05-01 in 0.08 sec.
2025-11-14 17:47:28,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,303 - INFO - Going to convert document batch...
2025-11-14 17:47:28,304 - INFO - Processing document 4_2024-05-03
2025-11-14 17:47:28,385 - INFO - Finished converting document 4_2024-05-03 in 0.14 sec.


Converted 'data\edgar_documents\TXN\4_2024-05-01' --> 'data\processed_data\TXN\4_2024-05-01.md'


2025-11-14 17:47:28,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,494 - INFO - Going to convert document batch...
2025-11-14 17:47:28,495 - INFO - Processing document 4_2024-05-06
2025-11-14 17:47:28,575 - INFO - Finished converting document 4_2024-05-06 in 0.14 sec.


Converted 'data\edgar_documents\TXN\4_2024-05-03' --> 'data\processed_data\TXN\4_2024-05-03.md'
Converted 'data\edgar_documents\TXN\4_2024-05-06' --> 'data\processed_data\TXN\4_2024-05-06.md'


2025-11-14 17:47:28,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,722 - INFO - Going to convert document batch...
2025-11-14 17:47:28,723 - INFO - Processing document 4_2024-05-15
2025-11-14 17:47:28,764 - INFO - Finished converting document 4_2024-05-15 in 0.14 sec.
2025-11-14 17:47:28,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,829 - INFO - Going to convert document batch...
2025-11-14 17:47:28,831 - INFO - Processing document 4_2024-06-25
2025-11-14 17:47:28,866 - INFO - Finished converting document 4_2024-06-25 in 0.06 sec.
2025-11-14 17:47:28,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:28,925 - INFO - Going to convert document batch...
2025-11-14 17:47:28,927 - INFO - Processing document 4_2024-08-01
2025-11-14 17:47:28,967 - INFO - Finished converting document 4_2024-08-01 in 0.08 sec.


Converted 'data\edgar_documents\TXN\4_2024-05-15' --> 'data\processed_data\TXN\4_2024-05-15.md'
Converted 'data\edgar_documents\TXN\4_2024-06-25' --> 'data\processed_data\TXN\4_2024-06-25.md'


2025-11-14 17:47:29,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,044 - INFO - Going to convert document batch...
2025-11-14 17:47:29,051 - INFO - Processing document 4_2024-08-26
2025-11-14 17:47:29,107 - INFO - Finished converting document 4_2024-08-26 in 0.11 sec.
2025-11-14 17:47:29,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,190 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TXN\4_2024-08-01' --> 'data\processed_data\TXN\4_2024-08-01.md'
Converted 'data\edgar_documents\TXN\4_2024-08-26' --> 'data\processed_data\TXN\4_2024-08-26.md'


2025-11-14 17:47:29,191 - INFO - Processing document 4_2024-08-27
2025-11-14 17:47:29,232 - INFO - Finished converting document 4_2024-08-27 in 0.08 sec.
2025-11-14 17:47:29,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,333 - INFO - Going to convert document batch...
2025-11-14 17:47:29,334 - INFO - Processing document 4_2024-08-28
2025-11-14 17:47:29,375 - INFO - Finished converting document 4_2024-08-28 in 0.09 sec.
2025-11-14 17:47:29,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,447 - INFO - Going to convert document batch...
2025-11-14 17:47:29,448 - INFO - Processing document 4_2024-08-29


Converted 'data\edgar_documents\TXN\4_2024-08-27' --> 'data\processed_data\TXN\4_2024-08-27.md'
Converted 'data\edgar_documents\TXN\4_2024-08-28' --> 'data\processed_data\TXN\4_2024-08-28.md'


2025-11-14 17:47:29,494 - INFO - Finished converting document 4_2024-08-29 in 0.08 sec.
2025-11-14 17:47:29,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,566 - INFO - Going to convert document batch...
2025-11-14 17:47:29,567 - INFO - Processing document 4_2024-09-03
2025-11-14 17:47:29,614 - INFO - Finished converting document 4_2024-09-03 in 0.08 sec.
2025-11-14 17:47:29,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\4_2024-08-29' --> 'data\processed_data\TXN\4_2024-08-29.md'
Converted 'data\edgar_documents\TXN\4_2024-09-03' --> 'data\processed_data\TXN\4_2024-09-03.md'


2025-11-14 17:47:29,790 - INFO - Going to convert document batch...
2025-11-14 17:47:29,793 - INFO - Processing document 4_2024-09-24
2025-11-14 17:47:29,846 - INFO - Finished converting document 4_2024-09-24 in 0.17 sec.
2025-11-14 17:47:29,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:29,913 - INFO - Going to convert document batch...
2025-11-14 17:47:29,914 - INFO - Processing document 4_2024-10-29
2025-11-14 17:47:29,954 - INFO - Finished converting document 4_2024-10-29 in 0.08 sec.
2025-11-14 17:47:30,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,016 - INFO - Going to convert document batch...
2025-11-14 17:47:30,016 - INFO - Processing document 4_2024-11-04
2025-11-14 17:47:30,048 - INFO - Finished converting document 4_2024-11-04 in 0.06 sec.


Converted 'data\edgar_documents\TXN\4_2024-09-24' --> 'data\processed_data\TXN\4_2024-09-24.md'
Converted 'data\edgar_documents\TXN\4_2024-10-29' --> 'data\processed_data\TXN\4_2024-10-29.md'


2025-11-14 17:47:30,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,114 - INFO - Going to convert document batch...
2025-11-14 17:47:30,116 - INFO - Processing document 4_2024-11-08
2025-11-14 17:47:30,152 - INFO - Finished converting document 4_2024-11-08 in 0.08 sec.
2025-11-14 17:47:30,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,224 - INFO - Going to convert document batch...
2025-11-14 17:47:30,225 - INFO - Processing document 4_2024-11-13


Converted 'data\edgar_documents\TXN\4_2024-11-04' --> 'data\processed_data\TXN\4_2024-11-04.md'
Converted 'data\edgar_documents\TXN\4_2024-11-08' --> 'data\processed_data\TXN\4_2024-11-08.md'


2025-11-14 17:47:30,271 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 17:47:30,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,351 - INFO - Going to convert document batch...
2025-11-14 17:47:30,352 - INFO - Processing document 4_2024-11-26
2025-11-14 17:47:30,391 - INFO - Finished converting document 4_2024-11-26 in 0.08 sec.
2025-11-14 17:47:30,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,463 - INFO - Going to convert document batch...
2025-11-14 17:47:30,464 - INFO - Processing document 4_2024-12-20
2025-11-14 17:47:30,501 - INFO - Finished converting document 4_2024-12-20 in 0.08 sec.


Converted 'data\edgar_documents\TXN\4_2024-11-13' --> 'data\processed_data\TXN\4_2024-11-13.md'
Converted 'data\edgar_documents\TXN\4_2024-11-26' --> 'data\processed_data\TXN\4_2024-11-26.md'


2025-11-14 17:47:30,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,592 - INFO - Going to convert document batch...
2025-11-14 17:47:30,594 - INFO - Processing document 4_2025-01-29
2025-11-14 17:47:30,646 - INFO - Finished converting document 4_2025-01-29 in 0.09 sec.
2025-11-14 17:47:30,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,741 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TXN\4_2024-12-20' --> 'data\processed_data\TXN\4_2024-12-20.md'
Converted 'data\edgar_documents\TXN\4_2025-01-29' --> 'data\processed_data\TXN\4_2025-01-29.md'


2025-11-14 17:47:30,742 - INFO - Processing document 4_2025-01-30
2025-11-14 17:47:30,788 - INFO - Finished converting document 4_2025-01-30 in 0.08 sec.
2025-11-14 17:47:30,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,852 - INFO - Going to convert document batch...
2025-11-14 17:47:30,853 - INFO - Processing document 4_2025-02-03
2025-11-14 17:47:30,894 - INFO - Finished converting document 4_2025-02-03 in 0.06 sec.
2025-11-14 17:47:30,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:30,974 - INFO - Going to convert document batch...
2025-11-14 17:47:30,975 - INFO - Processing document 4_2025-02-05
2025-11-14 17:47:31,019 - INFO - Finished converting document 4_2025-02-05 in 0.08 sec.


Converted 'data\edgar_documents\TXN\4_2025-01-30' --> 'data\processed_data\TXN\4_2025-01-30.md'
Converted 'data\edgar_documents\TXN\4_2025-02-03' --> 'data\processed_data\TXN\4_2025-02-03.md'


2025-11-14 17:47:31,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,095 - INFO - Going to convert document batch...
2025-11-14 17:47:31,096 - INFO - Processing document 4_2025-02-19
2025-11-14 17:47:31,128 - INFO - Finished converting document 4_2025-02-19 in 0.06 sec.
2025-11-14 17:47:31,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,207 - INFO - Going to convert document batch...
2025-11-14 17:47:31,208 - INFO - Processing document 4_2025-02-20


Converted 'data\edgar_documents\TXN\4_2025-02-05' --> 'data\processed_data\TXN\4_2025-02-05.md'
Converted 'data\edgar_documents\TXN\4_2025-02-19' --> 'data\processed_data\TXN\4_2025-02-19.md'


2025-11-14 17:47:31,265 - INFO - Finished converting document 4_2025-02-20 in 0.11 sec.
2025-11-14 17:47:31,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,354 - INFO - Going to convert document batch...
2025-11-14 17:47:31,355 - INFO - Processing document 4_2025-02-25
2025-11-14 17:47:31,414 - INFO - Finished converting document 4_2025-02-25 in 0.09 sec.
2025-11-14 17:47:31,479 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,508 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\TXN\4_2025-02-20' --> 'data\processed_data\TXN\4_2025-02-20.md'
Converted 'data\edgar_documents\TXN\4_2025-02-25' --> 'data\processed_data\TXN\4_2025-02-25.md'


2025-11-14 17:47:31,509 - INFO - Processing document 4_2025-02-27
2025-11-14 17:47:31,571 - INFO - Finished converting document 4_2025-02-27 in 0.11 sec.
2025-11-14 17:47:31,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,682 - INFO - Going to convert document batch...
2025-11-14 17:47:31,684 - INFO - Processing document 4_2025-03-03
2025-11-14 17:47:31,769 - INFO - Finished converting document 4_2025-03-03 in 0.14 sec.


Converted 'data\edgar_documents\TXN\4_2025-02-27' --> 'data\processed_data\TXN\4_2025-02-27.md'


2025-11-14 17:47:31,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:31,902 - INFO - Going to convert document batch...
2025-11-14 17:47:31,904 - INFO - Processing document 4_2025-03-21
2025-11-14 17:47:31,962 - INFO - Finished converting document 4_2025-03-21 in 0.09 sec.
2025-11-14 17:47:32,062 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\TXN\4_2025-03-03' --> 'data\processed_data\TXN\4_2025-03-03.md'
Converted 'data\edgar_documents\TXN\4_2025-03-21' --> 'data\processed_data\TXN\4_2025-03-21.md'


2025-11-14 17:47:32,063 - ERROR - Input document 4_2025-05-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:47:32,065 - INFO - Going to convert document batch...
2025-11-14 17:47:32,089 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:47:32,090 - ERROR - Input document 4_2025-05-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\TXN\4_2025-05-20: File format not allowed: data\edgar_documents\TXN\4_2025-05-20
Error processing data\edgar_documents\TXN\4_2025-05-22: File format not allowed: data\edgar_documents\TXN\4_2025-05-22
Converted 'data\edgar_documents\TXN\4_2025-06-20' --> 'data\processed_data\TXN\4_2025-06-20.md'


2025-11-14 17:47:32,268 - INFO - Going to convert document batch...
2025-11-14 17:47:32,269 - INFO - Processing document 4_2025-08-27
2025-11-14 17:47:32,313 - INFO - Finished converting document 4_2025-08-27 in 0.09 sec.
2025-11-14 17:47:32,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:32,415 - INFO - Going to convert document batch...
2025-11-14 17:47:32,416 - INFO - Processing document 4_2025-09-22
2025-11-14 17:47:32,464 - INFO - Finished converting document 4_2025-09-22 in 0.11 sec.
2025-11-14 17:47:32,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:32,537 - INFO - Going to convert document batch...
2025-11-14 17:47:32,538 - INFO - Processing document 4_2025-10-30


Converted 'data\edgar_documents\TXN\4_2025-08-27' --> 'data\processed_data\TXN\4_2025-08-27.md'
Converted 'data\edgar_documents\TXN\4_2025-09-22' --> 'data\processed_data\TXN\4_2025-09-22.md'


2025-11-14 17:47:32,578 - INFO - Finished converting document 4_2025-10-30 in 0.08 sec.
2025-11-14 17:47:32,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:32,655 - INFO - Going to convert document batch...
2025-11-14 17:47:32,656 - INFO - Processing document 4_2025-11-03
2025-11-14 17:47:32,691 - INFO - Finished converting document 4_2025-11-03 in 0.06 sec.
2025-11-14 17:47:32,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:32,766 - INFO - Going to convert document batch...
2025-11-14 17:47:32,767 - INFO - Processing document 8-K_2023-01-20
2025-11-14 17:47:32,791 - INFO - Finished converting document 8-K_2023-01-20 in 0.06 sec.


Converted 'data\edgar_documents\TXN\4_2025-10-30' --> 'data\processed_data\TXN\4_2025-10-30.md'
Converted 'data\edgar_documents\TXN\4_2025-11-03' --> 'data\processed_data\TXN\4_2025-11-03.md'


2025-11-14 17:47:32,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:32,866 - INFO - Going to convert document batch...
2025-11-14 17:47:32,867 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:47:32,926 - INFO - Finished converting document 8-K_2023-01-24 in 0.11 sec.
2025-11-14 17:47:32,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\8-K_2023-01-20' --> 'data\processed_data\TXN\8-K_2023-01-20.md'
Converted 'data\edgar_documents\TXN\8-K_2023-01-24' --> 'data\processed_data\TXN\8-K_2023-01-24.md'


2025-11-14 17:47:33,026 - INFO - Going to convert document batch...
2025-11-14 17:47:33,027 - INFO - Processing document 8-K_2023-02-16
2025-11-14 17:47:33,057 - INFO - Finished converting document 8-K_2023-02-16 in 0.09 sec.
2025-11-14 17:47:33,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:33,119 - INFO - Going to convert document batch...
2025-11-14 17:47:33,120 - INFO - Processing document 8-K_2023-03-14
2025-11-14 17:47:33,159 - INFO - Finished converting document 8-K_2023-03-14 in 0.08 sec.
2025-11-14 17:47:33,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:33,228 - INFO - Going to convert document batch...
2025-11-14 17:47:33,229 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:47:33,276 - INFO - Finished converting document 8-K_2023-04-25 in 0.11 sec.


Converted 'data\edgar_documents\TXN\8-K_2023-02-16' --> 'data\processed_data\TXN\8-K_2023-02-16.md'
Converted 'data\edgar_documents\TXN\8-K_2023-03-14' --> 'data\processed_data\TXN\8-K_2023-03-14.md'


2025-11-14 17:47:33,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:33,387 - INFO - Going to convert document batch...
2025-11-14 17:47:33,391 - INFO - Processing document 8-K_2023-05-03
2025-11-14 17:47:33,482 - INFO - Finished converting document 8-K_2023-05-03 in 0.19 sec.


Converted 'data\edgar_documents\TXN\8-K_2023-04-25' --> 'data\processed_data\TXN\8-K_2023-04-25.md'


2025-11-14 17:47:33,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:33,617 - INFO - Going to convert document batch...
2025-11-14 17:47:33,618 - INFO - Processing document 8-K_2023-05-18
2025-11-14 17:47:33,653 - INFO - Finished converting document 8-K_2023-05-18 in 0.08 sec.
2025-11-14 17:47:33,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\8-K_2023-05-03' --> 'data\processed_data\TXN\8-K_2023-05-03.md'
Converted 'data\edgar_documents\TXN\8-K_2023-05-18' --> 'data\processed_data\TXN\8-K_2023-05-18.md'


2025-11-14 17:47:33,803 - INFO - Going to convert document batch...
2025-11-14 17:47:33,808 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:47:33,873 - INFO - Finished converting document 8-K_2023-07-25 in 0.20 sec.
2025-11-14 17:47:33,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:33,931 - INFO - Going to convert document batch...
2025-11-14 17:47:33,932 - INFO - Processing document 8-K_2023-09-21
2025-11-14 17:47:33,970 - INFO - Finished converting document 8-K_2023-09-21 in 0.08 sec.
2025-11-14 17:47:34,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,038 - INFO - Going to convert document batch...
2025-11-14 17:47:34,039 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:47:34,088 - INFO - Finished converting document 8-K_2023-10-24 in 0.11 sec.


Converted 'data\edgar_documents\TXN\8-K_2023-07-25' --> 'data\processed_data\TXN\8-K_2023-07-25.md'
Converted 'data\edgar_documents\TXN\8-K_2023-09-21' --> 'data\processed_data\TXN\8-K_2023-09-21.md'


2025-11-14 17:47:34,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,164 - INFO - Going to convert document batch...
2025-11-14 17:47:34,165 - INFO - Processing document 8-K_2024-01-12
2025-11-14 17:47:34,186 - INFO - Finished converting document 8-K_2024-01-12 in 0.08 sec.
2025-11-14 17:47:34,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,246 - INFO - Going to convert document batch...
2025-11-14 17:47:34,247 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:47:34,291 - INFO - Finished converting document 8-K_2024-01-23 in 0.08 sec.


Converted 'data\edgar_documents\TXN\8-K_2023-10-24' --> 'data\processed_data\TXN\8-K_2023-10-24.md'
Converted 'data\edgar_documents\TXN\8-K_2024-01-12' --> 'data\processed_data\TXN\8-K_2024-01-12.md'


2025-11-14 17:47:34,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,348 - INFO - Going to convert document batch...
2025-11-14 17:47:34,349 - INFO - Processing document 8-K_2024-02-08
2025-11-14 17:47:34,383 - INFO - Finished converting document 8-K_2024-02-08 in 0.06 sec.
2025-11-14 17:47:34,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,450 - INFO - Going to convert document batch...
2025-11-14 17:47:34,452 - INFO - Processing document 8-K_2024-02-20
2025-11-14 17:47:34,488 - INFO - Finished converting document 8-K_2024-02-20 in 0.08 sec.


Converted 'data\edgar_documents\TXN\8-K_2024-01-23' --> 'data\processed_data\TXN\8-K_2024-01-23.md'
Converted 'data\edgar_documents\TXN\8-K_2024-02-08' --> 'data\processed_data\TXN\8-K_2024-02-08.md'
Converted 'data\edgar_documents\TXN\8-K_2024-02-20' --> 'data\processed_data\TXN\8-K_2024-02-20.md'


2025-11-14 17:47:34,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,543 - INFO - Going to convert document batch...
2025-11-14 17:47:34,545 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:47:34,587 - INFO - Finished converting document 8-K_2024-04-23 in 0.08 sec.
2025-11-14 17:47:34,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:34,692 - INFO - Going to convert document batch...
2025-11-14 17:47:34,693 - INFO - Processing document 8-K_2024-04-26


Converted 'data\edgar_documents\TXN\8-K_2024-04-23' --> 'data\processed_data\TXN\8-K_2024-04-23.md'


2025-11-14 17:47:35,385 - INFO - Finished converting document 8-K_2024-04-26 in 0.77 sec.
2025-11-14 17:47:35,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:35,485 - INFO - Going to convert document batch...
2025-11-14 17:47:35,486 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:47:35,537 - INFO - Finished converting document 8-K_2024-07-23 in 0.08 sec.
2025-11-14 17:47:35,580 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:35,600 - INFO - Going to convert document batch...
2025-11-14 17:47:35,600 - INFO - Processing document 8-K_2024-09-19


Converted 'data\edgar_documents\TXN\8-K_2024-04-26' --> 'data\processed_data\TXN\8-K_2024-04-26.md'
Converted 'data\edgar_documents\TXN\8-K_2024-07-23' --> 'data\processed_data\TXN\8-K_2024-07-23.md'


2025-11-14 17:47:35,644 - INFO - Finished converting document 8-K_2024-09-19 in 0.08 sec.
2025-11-14 17:47:35,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:35,704 - INFO - Going to convert document batch...
2025-11-14 17:47:35,705 - INFO - Processing document 8-K_2024-10-22
2025-11-14 17:47:35,775 - INFO - Finished converting document 8-K_2024-10-22 in 0.09 sec.
2025-11-14 17:47:35,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:35,842 - INFO - Going to convert document batch...
2025-11-14 17:47:35,843 - INFO - Processing document 8-K_2025-01-23


Converted 'data\edgar_documents\TXN\8-K_2024-09-19' --> 'data\processed_data\TXN\8-K_2024-09-19.md'
Converted 'data\edgar_documents\TXN\8-K_2024-10-22' --> 'data\processed_data\TXN\8-K_2024-10-22.md'


2025-11-14 17:47:35,884 - INFO - Finished converting document 8-K_2025-01-23 in 0.08 sec.
2025-11-14 17:47:35,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,014 - INFO - Going to convert document batch...
2025-11-14 17:47:36,015 - INFO - Processing document 8-K_2025-04-18
2025-11-14 17:47:36,087 - INFO - Finished converting document 8-K_2025-04-18 in 0.16 sec.


Converted 'data\edgar_documents\TXN\8-K_2025-01-23' --> 'data\processed_data\TXN\8-K_2025-01-23.md'


2025-11-14 17:47:36,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,160 - INFO - Going to convert document batch...
2025-11-14 17:47:36,162 - INFO - Processing document 8-K_2025-04-23
2025-11-14 17:47:36,209 - INFO - Finished converting document 8-K_2025-04-23 in 0.09 sec.


Converted 'data\edgar_documents\TXN\8-K_2025-04-18' --> 'data\processed_data\TXN\8-K_2025-04-18.md'
Converted 'data\edgar_documents\TXN\8-K_2025-04-23' --> 'data\processed_data\TXN\8-K_2025-04-23.md'


2025-11-14 17:47:36,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,384 - INFO - Going to convert document batch...
2025-11-14 17:47:36,386 - INFO - Processing document 8-K_2025-05-23
2025-11-14 17:47:36,425 - INFO - Finished converting document 8-K_2025-05-23 in 0.17 sec.
2025-11-14 17:47:36,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,481 - INFO - Going to convert document batch...
2025-11-14 17:47:36,483 - INFO - Processing document 8-K_2025-07-22
2025-11-14 17:47:36,525 - INFO - Finished converting document 8-K_2025-07-22 in 0.09 sec.
2025-11-14 17:47:36,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,587 - INFO - Going to convert document batch...
2025-11-14 17:47:36,588 - INFO - Processing document 8-K_2025-09-18


Converted 'data\edgar_documents\TXN\8-K_2025-05-23' --> 'data\processed_data\TXN\8-K_2025-05-23.md'
Converted 'data\edgar_documents\TXN\8-K_2025-07-22' --> 'data\processed_data\TXN\8-K_2025-07-22.md'


2025-11-14 17:47:36,631 - INFO - Finished converting document 8-K_2025-09-18 in 0.08 sec.
2025-11-14 17:47:36,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,701 - INFO - Going to convert document batch...
2025-11-14 17:47:36,702 - INFO - Processing document 8-K_2025-10-16
2025-11-14 17:47:36,743 - INFO - Finished converting document 8-K_2025-10-16 in 0.08 sec.
2025-11-14 17:47:36,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:47:36,826 - INFO - Going to convert document batch...
2025-11-14 17:47:36,828 - INFO - Processing document 8-K_2025-10-21


Converted 'data\edgar_documents\TXN\8-K_2025-09-18' --> 'data\processed_data\TXN\8-K_2025-09-18.md'
Converted 'data\edgar_documents\TXN\8-K_2025-10-16' --> 'data\processed_data\TXN\8-K_2025-10-16.md'


2025-11-14 17:47:36,880 - INFO - Finished converting document 8-K_2025-10-21 in 0.11 sec.
2025-11-14 17:47:36,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\8-K_2025-10-21' --> 'data\processed_data\TXN\8-K_2025-10-21.md'


2025-11-14 17:47:37,704 - INFO - Going to convert document batch...
2025-11-14 17:47:37,705 - INFO - Processing document DEF-14A_2023-03-14
2025-11-14 17:47:39,449 - INFO - Finished converting document DEF-14A_2023-03-14 in 2.55 sec.
2025-11-14 17:47:40,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\DEF-14A_2023-03-14' --> 'data\processed_data\TXN\DEF-14A_2023-03-14.md'


2025-11-14 17:47:41,668 - INFO - Going to convert document batch...
2025-11-14 17:47:41,673 - INFO - Processing document DEF-14A_2024-03-12
2025-11-14 17:47:43,341 - INFO - Finished converting document DEF-14A_2024-03-12 in 3.11 sec.
2025-11-14 17:47:44,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\DEF-14A_2024-03-12' --> 'data\processed_data\TXN\DEF-14A_2024-03-12.md'


2025-11-14 17:47:45,047 - INFO - Going to convert document batch...
2025-11-14 17:47:45,049 - INFO - Processing document DEF-14A_2025-03-05
2025-11-14 17:47:46,816 - INFO - Finished converting document DEF-14A_2025-03-05 in 2.70 sec.
2025-11-14 17:47:47,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\TXN\DEF-14A_2025-03-05' --> 'data\processed_data\TXN\DEF-14A_2025-03-05.md'
Processed 94 new files. Errors: 8
Found 141 files to process in data\edgar_documents\UNH


2025-11-14 17:47:49,945 - INFO - Going to convert document batch...
2025-11-14 17:47:49,946 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:47:49,948 - INFO - Processing document 10-K_2023-02-24
2025-11-14 17:47:52,979 - INFO - Finished converting document 10-K_2023-02-24 in 5.38 sec.
2025-11-14 17:47:54,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-K_2023-02-24' --> 'data\processed_data\UNH\10-K_2023-02-24.md'


2025-11-14 17:47:56,058 - INFO - Going to convert document batch...
2025-11-14 17:47:56,059 - INFO - Processing document 10-K_2024-02-28
2025-11-14 17:47:59,260 - INFO - Finished converting document 10-K_2024-02-28 in 4.95 sec.
2025-11-14 17:48:00,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-K_2024-02-28' --> 'data\processed_data\UNH\10-K_2024-02-28.md'


2025-11-14 17:48:02,751 - INFO - Going to convert document batch...
2025-11-14 17:48:02,752 - INFO - Processing document 10-K_2025-02-27
2025-11-14 17:48:04,200 - INFO - Finished converting document 10-K_2025-02-27 in 3.53 sec.
2025-11-14 17:48:05,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-K_2025-02-27' --> 'data\processed_data\UNH\10-K_2025-02-27.md'


2025-11-14 17:48:06,151 - INFO - Going to convert document batch...
2025-11-14 17:48:06,152 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 17:48:06,697 - INFO - Finished converting document 10-Q_2023-05-03 in 1.27 sec.
2025-11-14 17:48:07,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2023-05-03' --> 'data\processed_data\UNH\10-Q_2023-05-03.md'


2025-11-14 17:48:07,396 - INFO - Going to convert document batch...
2025-11-14 17:48:07,397 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 17:48:08,053 - INFO - Finished converting document 10-Q_2023-08-02 in 1.08 sec.
2025-11-14 17:48:08,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2023-08-02' --> 'data\processed_data\UNH\10-Q_2023-08-02.md'


2025-11-14 17:48:09,110 - INFO - Going to convert document batch...
2025-11-14 17:48:09,111 - INFO - Processing document 10-Q_2023-11-06
2025-11-14 17:48:09,736 - INFO - Finished converting document 10-Q_2023-11-06 in 1.38 sec.
2025-11-14 17:48:10,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2023-11-06' --> 'data\processed_data\UNH\10-Q_2023-11-06.md'


2025-11-14 17:48:10,459 - INFO - Going to convert document batch...
2025-11-14 17:48:10,460 - INFO - Processing document 10-Q_2024-05-09
2025-11-14 17:48:11,017 - INFO - Finished converting document 10-Q_2024-05-09 in 0.89 sec.
2025-11-14 17:48:11,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2024-05-09' --> 'data\processed_data\UNH\10-Q_2024-05-09.md'


2025-11-14 17:48:11,978 - INFO - Going to convert document batch...
2025-11-14 17:48:11,979 - INFO - Processing document 10-Q_2024-08-09
2025-11-14 17:48:12,656 - INFO - Finished converting document 10-Q_2024-08-09 in 1.38 sec.
2025-11-14 17:48:13,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2024-08-09' --> 'data\processed_data\UNH\10-Q_2024-08-09.md'


2025-11-14 17:48:13,349 - INFO - Going to convert document batch...
2025-11-14 17:48:13,350 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 17:48:13,994 - INFO - Finished converting document 10-Q_2024-11-04 in 1.00 sec.
2025-11-14 17:48:14,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2024-11-04' --> 'data\processed_data\UNH\10-Q_2024-11-04.md'


2025-11-14 17:48:14,902 - INFO - Going to convert document batch...
2025-11-14 17:48:14,904 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 17:48:15,368 - INFO - Finished converting document 10-Q_2025-05-07 in 1.05 sec.
2025-11-14 17:48:15,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2025-05-07' --> 'data\processed_data\UNH\10-Q_2025-05-07.md'


2025-11-14 17:48:16,040 - INFO - Going to convert document batch...
2025-11-14 17:48:16,041 - INFO - Processing document 10-Q_2025-08-11
2025-11-14 17:48:16,712 - INFO - Finished converting document 10-Q_2025-08-11 in 1.09 sec.
2025-11-14 17:48:17,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\10-Q_2025-08-11' --> 'data\processed_data\UNH\10-Q_2025-08-11.md'


2025-11-14 17:48:17,718 - INFO - Going to convert document batch...
2025-11-14 17:48:17,719 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 17:48:18,370 - INFO - Finished converting document 10-Q_2025-10-28 in 1.34 sec.
2025-11-14 17:48:18,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:18,721 - INFO - Going to convert document batch...
2025-11-14 17:48:18,723 - INFO - Processing document 4_2023-01-05
2025-11-14 17:48:18,739 - INFO - Finished converting document 4_2023-01-05 in 0.03 sec.
2025-11-14 17:48:18,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:18,780 - INFO - Going to convert document batch...
2025-11-14 17:48:18,780 - INFO - Processing document 4_2023-02-15
2025-11-14 17:48:18,799 - INFO - Finished converting document 4_2023-02-15 in 0.03 sec.
2025-11-14 17:48:18,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:18,835 - INFO - Going to convert document batch...
2025-11-14 17:48:18,

Converted 'data\edgar_documents\UNH\10-Q_2025-10-28' --> 'data\processed_data\UNH\10-Q_2025-10-28.md'
Converted 'data\edgar_documents\UNH\4_2023-01-05' --> 'data\processed_data\UNH\4_2023-01-05.md'
Converted 'data\edgar_documents\UNH\4_2023-02-15' --> 'data\processed_data\UNH\4_2023-02-15.md'
Converted 'data\edgar_documents\UNH\4_2023-02-23' --> 'data\processed_data\UNH\4_2023-02-23.md'


2025-11-14 17:48:18,892 - INFO - Processing document 4_2023-02-27
2025-11-14 17:48:18,914 - INFO - Finished converting document 4_2023-02-27 in 0.03 sec.
2025-11-14 17:48:18,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:18,970 - INFO - Going to convert document batch...
2025-11-14 17:48:18,972 - INFO - Processing document 4_2023-03-23
2025-11-14 17:48:18,998 - INFO - Finished converting document 4_2023-03-23 in 0.06 sec.
2025-11-14 17:48:19,062 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:19,063 - ERROR - Input document 4_2023-03-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\UNH\4_2023-02-27' --> 'data\processed_data\UNH\4_2023-02-27.md'
Converted 'data\edgar_documents\UNH\4_2023-03-23' --> 'data\processed_data\UNH\4_2023-03-23.md'
Error processing data\edgar_documents\UNH\4_2023-03-24: File format not allowed: data\edgar_documents\UNH\4_2023-03-24
Converted 'data\edgar_documents\UNH\4_2023-04-05' --> 'data\processed_data\UNH\4_2023-04-05.md'


2025-11-14 17:48:19,152 - INFO - Going to convert document batch...
2025-11-14 17:48:19,153 - INFO - Processing document 4_2023-04-21
2025-11-14 17:48:19,173 - INFO - Finished converting document 4_2023-04-21 in 0.05 sec.
2025-11-14 17:48:19,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,221 - INFO - Going to convert document batch...
2025-11-14 17:48:19,222 - INFO - Processing document 4_2023-04-25
2025-11-14 17:48:19,247 - INFO - Finished converting document 4_2023-04-25 in 0.05 sec.
2025-11-14 17:48:19,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,303 - INFO - Going to convert document batch...
2025-11-14 17:48:19,304 - INFO - Processing document 4_2023-05-01
2025-11-14 17:48:19,321 - INFO - Finished converting document 4_2023-05-01 in 0.05 sec.
2025-11-14 17:48:19,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,365 - INFO - Going to convert document batch...
2025-11-14 17:48:19,366 - 

Converted 'data\edgar_documents\UNH\4_2023-04-21' --> 'data\processed_data\UNH\4_2023-04-21.md'
Converted 'data\edgar_documents\UNH\4_2023-04-25' --> 'data\processed_data\UNH\4_2023-04-25.md'
Converted 'data\edgar_documents\UNH\4_2023-05-01' --> 'data\processed_data\UNH\4_2023-05-01.md'


2025-11-14 17:48:19,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,423 - INFO - Going to convert document batch...
2025-11-14 17:48:19,424 - INFO - Processing document 4_2023-06-08
2025-11-14 17:48:19,441 - INFO - Finished converting document 4_2023-06-08 in 0.03 sec.
2025-11-14 17:48:19,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,507 - INFO - Going to convert document batch...
2025-11-14 17:48:19,508 - INFO - Processing document 4_2023-06-29
2025-11-14 17:48:19,534 - INFO - Finished converting document 4_2023-06-29 in 0.06 sec.
2025-11-14 17:48:19,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,581 - INFO - Going to convert document batch...
2025-11-14 17:48:19,582 - INFO - Processing document 4_2023-07-06
2025-11-14 17:48:19,601 - INFO - Finished converting document 4_2023-07-06 in 0.03 sec.


Converted 'data\edgar_documents\UNH\4_2023-06-07' --> 'data\processed_data\UNH\4_2023-06-07.md'
Converted 'data\edgar_documents\UNH\4_2023-06-08' --> 'data\processed_data\UNH\4_2023-06-08.md'
Converted 'data\edgar_documents\UNH\4_2023-06-29' --> 'data\processed_data\UNH\4_2023-06-29.md'


2025-11-14 17:48:19,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,646 - INFO - Going to convert document batch...
2025-11-14 17:48:19,647 - INFO - Processing document 4_2023-07-21
2025-11-14 17:48:19,669 - INFO - Finished converting document 4_2023-07-21 in 0.05 sec.
2025-11-14 17:48:19,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,714 - INFO - Going to convert document batch...
2025-11-14 17:48:19,715 - INFO - Processing document 4_2023-08-15
2025-11-14 17:48:19,734 - INFO - Finished converting document 4_2023-08-15 in 0.05 sec.
2025-11-14 17:48:19,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,776 - INFO - Going to convert document batch...
2025-11-14 17:48:19,777 - INFO - Processing document 4_2023-08-16
2025-11-14 17:48:19,798 - INFO - Finished converting document 4_2023-08-16 in 0.05 sec.


Converted 'data\edgar_documents\UNH\4_2023-07-06' --> 'data\processed_data\UNH\4_2023-07-06.md'
Converted 'data\edgar_documents\UNH\4_2023-07-21' --> 'data\processed_data\UNH\4_2023-07-21.md'
Converted 'data\edgar_documents\UNH\4_2023-08-15' --> 'data\processed_data\UNH\4_2023-08-15.md'


2025-11-14 17:48:19,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,838 - INFO - Going to convert document batch...
2025-11-14 17:48:19,838 - INFO - Processing document 4_2023-08-31
2025-11-14 17:48:19,857 - INFO - Finished converting document 4_2023-08-31 in 0.05 sec.
2025-11-14 17:48:19,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,930 - INFO - Going to convert document batch...
2025-11-14 17:48:19,931 - INFO - Processing document 4_2023-09-21
2025-11-14 17:48:19,948 - INFO - Finished converting document 4_2023-09-21 in 0.06 sec.
2025-11-14 17:48:19,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:19,987 - INFO - Going to convert document batch...
2025-11-14 17:48:19,988 - INFO - Processing document 4_2023-10-04
2025-11-14 17:48:20,005 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.


Converted 'data\edgar_documents\UNH\4_2023-08-16' --> 'data\processed_data\UNH\4_2023-08-16.md'
Converted 'data\edgar_documents\UNH\4_2023-08-31' --> 'data\processed_data\UNH\4_2023-08-31.md'
Converted 'data\edgar_documents\UNH\4_2023-09-21' --> 'data\processed_data\UNH\4_2023-09-21.md'


2025-11-14 17:48:20,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,044 - INFO - Going to convert document batch...
2025-11-14 17:48:20,045 - INFO - Processing document 4_2023-10-18
2025-11-14 17:48:20,065 - INFO - Finished converting document 4_2023-10-18 in 0.05 sec.
2025-11-14 17:48:20,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,127 - INFO - Going to convert document batch...
2025-11-14 17:48:20,128 - INFO - Processing document 4_2023-10-19
2025-11-14 17:48:20,156 - INFO - Finished converting document 4_2023-10-19 in 0.08 sec.
2025-11-14 17:48:20,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,200 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UNH\4_2023-10-04' --> 'data\processed_data\UNH\4_2023-10-04.md'
Converted 'data\edgar_documents\UNH\4_2023-10-18' --> 'data\processed_data\UNH\4_2023-10-18.md'
Converted 'data\edgar_documents\UNH\4_2023-10-19' --> 'data\processed_data\UNH\4_2023-10-19.md'


2025-11-14 17:48:20,201 - INFO - Processing document 4_2023-11-08
2025-11-14 17:48:20,218 - INFO - Finished converting document 4_2023-11-08 in 0.05 sec.
2025-11-14 17:48:20,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,260 - INFO - Going to convert document batch...
2025-11-14 17:48:20,260 - INFO - Processing document 4_2023-11-20
2025-11-14 17:48:20,283 - INFO - Finished converting document 4_2023-11-20 in 0.05 sec.
2025-11-14 17:48:20,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,328 - INFO - Going to convert document batch...
2025-11-14 17:48:20,329 - INFO - Processing document 4_2023-11-27
2025-11-14 17:48:20,348 - INFO - Finished converting document 4_2023-11-27 in 0.05 sec.
2025-11-14 17:48:20,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,391 - INFO - Going to convert document batch...
2025-11-14 17:48:20,391 - INFO - Processing document 4_2023-12-07
2025-11-14 17:48:20,412 - IN

Converted 'data\edgar_documents\UNH\4_2023-11-08' --> 'data\processed_data\UNH\4_2023-11-08.md'
Converted 'data\edgar_documents\UNH\4_2023-11-20' --> 'data\processed_data\UNH\4_2023-11-20.md'
Converted 'data\edgar_documents\UNH\4_2023-11-27' --> 'data\processed_data\UNH\4_2023-11-27.md'
Converted 'data\edgar_documents\UNH\4_2023-12-07' --> 'data\processed_data\UNH\4_2023-12-07.md'


2025-11-14 17:48:20,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,476 - INFO - Going to convert document batch...
2025-11-14 17:48:20,477 - INFO - Processing document 4_2023-12-14
2025-11-14 17:48:20,494 - INFO - Finished converting document 4_2023-12-14 in 0.05 sec.
2025-11-14 17:48:20,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,540 - INFO - Going to convert document batch...
2025-11-14 17:48:20,541 - INFO - Processing document 4_2024-01-04
2025-11-14 17:48:20,559 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 17:48:20,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,598 - INFO - Going to convert document batch...
2025-11-14 17:48:20,599 - INFO - Processing document 4_2024-02-15
2025-11-14 17:48:20,618 - INFO - Finished converting document 4_2024-02-15 in 0.03 sec.
2025-11-14 17:48:20,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\UNH\4_2023-12-14' --> 'data\processed_data\UNH\4_2023-12-14.md'
Converted 'data\edgar_documents\UNH\4_2024-01-04' --> 'data\processed_data\UNH\4_2024-01-04.md'
Converted 'data\edgar_documents\UNH\4_2024-02-15' --> 'data\processed_data\UNH\4_2024-02-15.md'


2025-11-14 17:48:20,701 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 17:48:20,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,752 - INFO - Going to convert document batch...
2025-11-14 17:48:20,756 - INFO - Processing document 4_2024-02-23
2025-11-14 17:48:20,805 - INFO - Finished converting document 4_2024-02-23 in 0.06 sec.
2025-11-14 17:48:20,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,848 - INFO - Going to convert document batch...
2025-11-14 17:48:20,849 - INFO - Processing document 4_2024-02-26
2025-11-14 17:48:20,867 - INFO - Finished converting document 4_2024-02-26 in 0.03 sec.
2025-11-14 17:48:20,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:20,903 - INFO - Going to convert document batch...
2025-11-14 17:48:20,904 - INFO - Processing document 4_2024-03-12


Converted 'data\edgar_documents\UNH\4_2024-02-20' --> 'data\processed_data\UNH\4_2024-02-20.md'
Converted 'data\edgar_documents\UNH\4_2024-02-23' --> 'data\processed_data\UNH\4_2024-02-23.md'
Converted 'data\edgar_documents\UNH\4_2024-02-26' --> 'data\processed_data\UNH\4_2024-02-26.md'


2025-11-14 17:48:20,922 - INFO - Finished converting document 4_2024-03-12 in 0.05 sec.
2025-11-14 17:48:20,979 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:20,980 - ERROR - Input document 4_2024-03-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:48:20,981 - INFO - Going to convert document batch...
2025-11-14 17:48:20,998 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:20,999 - ERROR - Input document 4_2024-03-20 with forma

Converted 'data\edgar_documents\UNH\4_2024-03-12' --> 'data\processed_data\UNH\4_2024-03-12.md'
Error processing data\edgar_documents\UNH\4_2024-03-19: File format not allowed: data\edgar_documents\UNH\4_2024-03-19
Error processing data\edgar_documents\UNH\4_2024-03-20: File format not allowed: data\edgar_documents\UNH\4_2024-03-20
Converted 'data\edgar_documents\UNH\4_2024-03-21' --> 'data\processed_data\UNH\4_2024-03-21.md'


2025-11-14 17:48:21,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,143 - INFO - Going to convert document batch...
2025-11-14 17:48:21,143 - INFO - Processing document 4_2024-06-05
2025-11-14 17:48:21,165 - INFO - Finished converting document 4_2024-06-05 in 0.03 sec.
2025-11-14 17:48:21,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,230 - INFO - Going to convert document batch...
2025-11-14 17:48:21,231 - INFO - Processing document 4_2024-06-07
2025-11-14 17:48:21,274 - INFO - Finished converting document 4_2024-06-07 in 0.08 sec.
2025-11-14 17:48:21,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\4_2024-04-03' --> 'data\processed_data\UNH\4_2024-04-03.md'
Converted 'data\edgar_documents\UNH\4_2024-06-05' --> 'data\processed_data\UNH\4_2024-06-05.md'
Converted 'data\edgar_documents\UNH\4_2024-06-07' --> 'data\processed_data\UNH\4_2024-06-07.md'


2025-11-14 17:48:21,327 - INFO - Going to convert document batch...
2025-11-14 17:48:21,328 - INFO - Processing document 4_2024-06-10
2025-11-14 17:48:21,710 - INFO - Finished converting document 4_2024-06-10 in 0.41 sec.
2025-11-14 17:48:21,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,750 - INFO - Going to convert document batch...
2025-11-14 17:48:21,751 - INFO - Processing document 4_2024-06-11
2025-11-14 17:48:21,767 - INFO - Finished converting document 4_2024-06-11 in 0.03 sec.
2025-11-14 17:48:21,797 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,813 - INFO - Going to convert document batch...
2025-11-14 17:48:21,814 - INFO - Processing document 4_2024-06-14
2025-11-14 17:48:21,847 - INFO - Finished converting document 4_2024-06-14 in 0.06 sec.
2025-11-14 17:48:21,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,890 - INFO - Going to convert document batch...
2025-11-14 17:48:21,891 - 

Converted 'data\edgar_documents\UNH\4_2024-06-10' --> 'data\processed_data\UNH\4_2024-06-10.md'
Converted 'data\edgar_documents\UNH\4_2024-06-11' --> 'data\processed_data\UNH\4_2024-06-11.md'
Converted 'data\edgar_documents\UNH\4_2024-06-14' --> 'data\processed_data\UNH\4_2024-06-14.md'


2025-11-14 17:48:21,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:21,945 - INFO - Going to convert document batch...
2025-11-14 17:48:21,945 - INFO - Processing document 4_2024-07-02
2025-11-14 17:48:21,962 - INFO - Finished converting document 4_2024-07-02 in 0.03 sec.
2025-11-14 17:48:21,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,005 - INFO - Going to convert document batch...
2025-11-14 17:48:22,006 - INFO - Processing document 4_2024-07-19
2025-11-14 17:48:22,026 - INFO - Finished converting document 4_2024-07-19 in 0.05 sec.
2025-11-14 17:48:22,070 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:22,070 - ERROR - Input document 4_2024-07-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\UNH\4_2024-06-27' --> 'data\processed_data\UNH\4_2024-06-27.md'
Converted 'data\edgar_documents\UNH\4_2024-07-02' --> 'data\processed_data\UNH\4_2024-07-02.md'
Converted 'data\edgar_documents\UNH\4_2024-07-19' --> 'data\processed_data\UNH\4_2024-07-19.md'
Error processing data\edgar_documents\UNH\4_2024-07-23: File format not allowed: data\edgar_documents\UNH\4_2024-07-23
Error processing data\edgar_documents\UNH\4_2024-07-24: File format not allowed: data\edgar_documents\UNH\4_2024-07-24


2025-11-14 17:48:22,112 - INFO - Processing document 4_2024-09-10
2025-11-14 17:48:22,134 - INFO - Finished converting document 4_2024-09-10 in 0.03 sec.
2025-11-14 17:48:22,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,183 - INFO - Going to convert document batch...
2025-11-14 17:48:22,184 - INFO - Processing document 4_2024-09-18
2025-11-14 17:48:22,210 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 17:48:22,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,271 - INFO - Going to convert document batch...
2025-11-14 17:48:22,271 - INFO - Processing document 4_2024-09-26
2025-11-14 17:48:22,291 - INFO - Finished converting document 4_2024-09-26 in 0.05 sec.
2025-11-14 17:48:22,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\4_2024-09-10' --> 'data\processed_data\UNH\4_2024-09-10.md'
Converted 'data\edgar_documents\UNH\4_2024-09-18' --> 'data\processed_data\UNH\4_2024-09-18.md'
Converted 'data\edgar_documents\UNH\4_2024-09-26' --> 'data\processed_data\UNH\4_2024-09-26.md'


2025-11-14 17:48:22,354 - INFO - Going to convert document batch...
2025-11-14 17:48:22,355 - INFO - Processing document 4_2024-10-03
2025-11-14 17:48:22,373 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 17:48:22,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,415 - INFO - Going to convert document batch...
2025-11-14 17:48:22,416 - INFO - Processing document 4_2024-11-05
2025-11-14 17:48:22,435 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 17:48:22,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,476 - INFO - Going to convert document batch...
2025-11-14 17:48:22,476 - INFO - Processing document 4_2024-11-13
2025-11-14 17:48:22,500 - INFO - Finished converting document 4_2024-11-13 in 0.05 sec.
2025-11-14 17:48:22,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,539 - INFO - Going to convert document batch...
2025-11-14 17:48:22,540 - 

Converted 'data\edgar_documents\UNH\4_2024-10-03' --> 'data\processed_data\UNH\4_2024-10-03.md'
Converted 'data\edgar_documents\UNH\4_2024-11-05' --> 'data\processed_data\UNH\4_2024-11-05.md'
Converted 'data\edgar_documents\UNH\4_2024-11-13' --> 'data\processed_data\UNH\4_2024-11-13.md'


2025-11-14 17:48:22,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,598 - INFO - Going to convert document batch...
2025-11-14 17:48:22,599 - INFO - Processing document 4_2024-12-19
2025-11-14 17:48:22,616 - INFO - Finished converting document 4_2024-12-19 in 0.03 sec.
2025-11-14 17:48:22,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,654 - INFO - Going to convert document batch...
2025-11-14 17:48:22,655 - INFO - Processing document 4_2025-01-06
2025-11-14 17:48:22,674 - INFO - Finished converting document 4_2025-01-06 in 0.03 sec.
2025-11-14 17:48:22,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,712 - INFO - Going to convert document batch...
2025-11-14 17:48:22,713 - INFO - Processing document 4_2025-01-22
2025-11-14 17:48:22,731 - INFO - Finished converting document 4_2025-01-22 in 0.05 sec.
2025-11-14 17:48:22,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\4_2024-11-15' --> 'data\processed_data\UNH\4_2024-11-15.md'
Converted 'data\edgar_documents\UNH\4_2024-12-19' --> 'data\processed_data\UNH\4_2024-12-19.md'
Converted 'data\edgar_documents\UNH\4_2025-01-06' --> 'data\processed_data\UNH\4_2025-01-06.md'
Converted 'data\edgar_documents\UNH\4_2025-01-22' --> 'data\processed_data\UNH\4_2025-01-22.md'


2025-11-14 17:48:22,769 - INFO - Going to convert document batch...
2025-11-14 17:48:22,770 - INFO - Processing document 4_2025-02-07
2025-11-14 17:48:22,790 - INFO - Finished converting document 4_2025-02-07 in 0.03 sec.
2025-11-14 17:48:22,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,831 - INFO - Going to convert document batch...
2025-11-14 17:48:22,832 - INFO - Processing document 4_2025-02-18
2025-11-14 17:48:22,849 - INFO - Finished converting document 4_2025-02-18 in 0.03 sec.
2025-11-14 17:48:22,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,888 - INFO - Going to convert document batch...
2025-11-14 17:48:22,889 - INFO - Processing document 4_2025-02-24
2025-11-14 17:48:22,912 - INFO - Finished converting document 4_2025-02-24 in 0.05 sec.
2025-11-14 17:48:22,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:22,975 - INFO - Going to convert document batch...
2025-11-14 17:48:22,975 - 

Converted 'data\edgar_documents\UNH\4_2025-02-07' --> 'data\processed_data\UNH\4_2025-02-07.md'
Converted 'data\edgar_documents\UNH\4_2025-02-18' --> 'data\processed_data\UNH\4_2025-02-18.md'
Converted 'data\edgar_documents\UNH\4_2025-02-24' --> 'data\processed_data\UNH\4_2025-02-24.md'


2025-11-14 17:48:23,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,036 - INFO - Going to convert document batch...
2025-11-14 17:48:23,036 - INFO - Processing document 4_2025-04-03
2025-11-14 17:48:23,056 - INFO - Finished converting document 4_2025-04-03 in 0.03 sec.
2025-11-14 17:48:23,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,095 - INFO - Going to convert document batch...
2025-11-14 17:48:23,096 - INFO - Processing document 4_2025-05-16
2025-11-14 17:48:23,114 - INFO - Finished converting document 4_2025-05-16 in 0.03 sec.
2025-11-14 17:48:23,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,167 - INFO - Going to convert document batch...
2025-11-14 17:48:23,169 - INFO - Processing document 4_2025-05-22
2025-11-14 17:48:23,194 - INFO - Finished converting document 4_2025-05-22 in 0.05 sec.


Converted 'data\edgar_documents\UNH\4_2025-03-20' --> 'data\processed_data\UNH\4_2025-03-20.md'
Converted 'data\edgar_documents\UNH\4_2025-04-03' --> 'data\processed_data\UNH\4_2025-04-03.md'
Converted 'data\edgar_documents\UNH\4_2025-05-16' --> 'data\processed_data\UNH\4_2025-05-16.md'


2025-11-14 17:48:23,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,240 - INFO - Going to convert document batch...
2025-11-14 17:48:23,241 - INFO - Processing document 4_2025-06-04
2025-11-14 17:48:23,261 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 17:48:23,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,300 - INFO - Going to convert document batch...
2025-11-14 17:48:23,301 - INFO - Processing document 4_2025-06-05
2025-11-14 17:48:23,318 - INFO - Finished converting document 4_2025-06-05 in 0.03 sec.
2025-11-14 17:48:23,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,356 - INFO - Going to convert document batch...
2025-11-14 17:48:23,356 - INFO - Processing document 4_2025-06-09
2025-11-14 17:48:23,384 - INFO - Finished converting document 4_2025-06-09 in 0.05 sec.


Converted 'data\edgar_documents\UNH\4_2025-05-22' --> 'data\processed_data\UNH\4_2025-05-22.md'
Converted 'data\edgar_documents\UNH\4_2025-06-04' --> 'data\processed_data\UNH\4_2025-06-04.md'
Converted 'data\edgar_documents\UNH\4_2025-06-05' --> 'data\processed_data\UNH\4_2025-06-05.md'


2025-11-14 17:48:23,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,431 - INFO - Going to convert document batch...
2025-11-14 17:48:23,432 - INFO - Processing document 4_2025-06-12
2025-11-14 17:48:23,464 - INFO - Finished converting document 4_2025-06-12 in 0.06 sec.
2025-11-14 17:48:23,511 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:23,512 - ERROR - Input document 4_2025-06-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:48

Converted 'data\edgar_documents\UNH\4_2025-06-09' --> 'data\processed_data\UNH\4_2025-06-09.md'
Converted 'data\edgar_documents\UNH\4_2025-06-12' --> 'data\processed_data\UNH\4_2025-06-12.md'
Error processing data\edgar_documents\UNH\4_2025-06-17: File format not allowed: data\edgar_documents\UNH\4_2025-06-17
Error processing data\edgar_documents\UNH\4_2025-06-18: File format not allowed: data\edgar_documents\UNH\4_2025-06-18


2025-11-14 17:48:23,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,631 - INFO - Going to convert document batch...
2025-11-14 17:48:23,632 - INFO - Processing document 4_2025-07-02
2025-11-14 17:48:23,651 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:48:23,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,694 - INFO - Going to convert document batch...
2025-11-14 17:48:23,694 - INFO - Processing document 4_2025-09-04
2025-11-14 17:48:23,717 - INFO - Finished converting document 4_2025-09-04 in 0.05 sec.
2025-11-14 17:48:23,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,757 - INFO - Going to convert document batch...
2025-11-14 17:48:23,758 - INFO - Processing document 4_2025-09-15
2025-11-14 17:48:23,775 - INFO - Finished converting document 4_2025-09-15 in 0.03 sec.


Converted 'data\edgar_documents\UNH\4_2025-06-26' --> 'data\processed_data\UNH\4_2025-06-26.md'
Converted 'data\edgar_documents\UNH\4_2025-07-02' --> 'data\processed_data\UNH\4_2025-07-02.md'
Converted 'data\edgar_documents\UNH\4_2025-09-04' --> 'data\processed_data\UNH\4_2025-09-04.md'


2025-11-14 17:48:23,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,816 - INFO - Going to convert document batch...
2025-11-14 17:48:23,817 - INFO - Processing document 4_2025-09-25
2025-11-14 17:48:23,837 - INFO - Finished converting document 4_2025-09-25 in 0.03 sec.
2025-11-14 17:48:23,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,880 - INFO - Going to convert document batch...
2025-11-14 17:48:23,880 - INFO - Processing document 4_2025-10-03
2025-11-14 17:48:23,903 - INFO - Finished converting document 4_2025-10-03 in 0.05 sec.
2025-11-14 17:48:23,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,949 - INFO - Going to convert document batch...
2025-11-14 17:48:23,950 - INFO - Processing document 8-K_2023-01-13
2025-11-14 17:48:23,965 - INFO - Finished converting document 8-K_2023-01-13 in 0.05 sec.


Converted 'data\edgar_documents\UNH\4_2025-09-15' --> 'data\processed_data\UNH\4_2025-09-15.md'
Converted 'data\edgar_documents\UNH\4_2025-09-25' --> 'data\processed_data\UNH\4_2025-09-25.md'
Converted 'data\edgar_documents\UNH\4_2025-10-03' --> 'data\processed_data\UNH\4_2025-10-03.md'
Converted 'data\edgar_documents\UNH\8-K_2023-01-13' --> 'data\processed_data\UNH\8-K_2023-01-13.md'


2025-11-14 17:48:23,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:23,994 - INFO - Going to convert document batch...
2025-11-14 17:48:23,996 - INFO - Processing document 8-K_2023-03-28
2025-11-14 17:48:24,017 - INFO - Finished converting document 8-K_2023-03-28 in 0.05 sec.
2025-11-14 17:48:24,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,054 - INFO - Going to convert document batch...
2025-11-14 17:48:24,055 - INFO - Processing document 8-K_2023-04-14
2025-11-14 17:48:24,072 - INFO - Finished converting document 8-K_2023-04-14 in 0.03 sec.
2025-11-14 17:48:24,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,100 - INFO - Going to convert document batch...
2025-11-14 17:48:24,101 - INFO - Processing document 8-K_2023-04-24
2025-11-14 17:48:24,116 - INFO - Finished converting document 8-K_2023-04-24 in 0.03 sec.
2025-11-14 17:48:24,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\UNH\8-K_2023-03-28' --> 'data\processed_data\UNH\8-K_2023-03-28.md'
Converted 'data\edgar_documents\UNH\8-K_2023-04-14' --> 'data\processed_data\UNH\8-K_2023-04-14.md'
Converted 'data\edgar_documents\UNH\8-K_2023-04-24' --> 'data\processed_data\UNH\8-K_2023-04-24.md'
Converted 'data\edgar_documents\UNH\8-K_2023-04-28' --> 'data\processed_data\UNH\8-K_2023-04-28.md'


2025-11-14 17:48:24,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,242 - INFO - Going to convert document batch...
2025-11-14 17:48:24,243 - INFO - Processing document 8-K_2023-05-30
2025-11-14 17:48:24,258 - INFO - Finished converting document 8-K_2023-05-30 in 0.03 sec.
2025-11-14 17:48:24,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,299 - INFO - Going to convert document batch...
2025-11-14 17:48:24,300 - INFO - Processing document 8-K_2023-06-09
2025-11-14 17:48:24,330 - INFO - Finished converting document 8-K_2023-06-09 in 0.06 sec.
2025-11-14 17:48:24,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,370 - INFO - Going to convert document batch...
2025-11-14 17:48:24,371 - INFO - Processing document 8-K_2023-07-14
2025-11-14 17:48:24,386 - INFO - Finished converting document 8-K_2023-07-14 in 0.05 sec.
2025-11-14 17:48:24,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\8-K_2023-05-05' --> 'data\processed_data\UNH\8-K_2023-05-05.md'
Converted 'data\edgar_documents\UNH\8-K_2023-05-30' --> 'data\processed_data\UNH\8-K_2023-05-30.md'
Converted 'data\edgar_documents\UNH\8-K_2023-06-09' --> 'data\processed_data\UNH\8-K_2023-06-09.md'
Converted 'data\edgar_documents\UNH\8-K_2023-07-14' --> 'data\processed_data\UNH\8-K_2023-07-14.md'


2025-11-14 17:48:24,421 - INFO - Going to convert document batch...
2025-11-14 17:48:24,422 - INFO - Processing document 8-K_2023-09-22
2025-11-14 17:48:24,436 - INFO - Finished converting document 8-K_2023-09-22 in 0.05 sec.
2025-11-14 17:48:24,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,470 - INFO - Going to convert document batch...
2025-11-14 17:48:24,471 - INFO - Processing document 8-K_2023-10-13
2025-11-14 17:48:24,488 - INFO - Finished converting document 8-K_2023-10-13 in 0.05 sec.
2025-11-14 17:48:24,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,524 - INFO - Going to convert document batch...
2025-11-14 17:48:24,525 - INFO - Processing document 8-K_2023-11-03
2025-11-14 17:48:24,542 - INFO - Finished converting document 8-K_2023-11-03 in 0.05 sec.
2025-11-14 17:48:24,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,574 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UNH\8-K_2023-09-22' --> 'data\processed_data\UNH\8-K_2023-09-22.md'
Converted 'data\edgar_documents\UNH\8-K_2023-10-13' --> 'data\processed_data\UNH\8-K_2023-10-13.md'
Converted 'data\edgar_documents\UNH\8-K_2023-11-03' --> 'data\processed_data\UNH\8-K_2023-11-03.md'
Converted 'data\edgar_documents\UNH\8-K_2023-11-22' --> 'data\processed_data\UNH\8-K_2023-11-22.md'


2025-11-14 17:48:24,623 - INFO - Processing document 8-K_2023-11-28
2025-11-14 17:48:24,638 - INFO - Finished converting document 8-K_2023-11-28 in 0.05 sec.
2025-11-14 17:48:24,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,669 - INFO - Going to convert document batch...
2025-11-14 17:48:24,670 - INFO - Processing document 8-K_2023-12-29
2025-11-14 17:48:24,685 - INFO - Finished converting document 8-K_2023-12-29 in 0.05 sec.
2025-11-14 17:48:24,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,713 - INFO - Going to convert document batch...
2025-11-14 17:48:24,714 - INFO - Processing document 8-K_2024-01-12
2025-11-14 17:48:24,729 - INFO - Finished converting document 8-K_2024-01-12 in 0.03 sec.
2025-11-14 17:48:24,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,778 - INFO - Going to convert document batch...
2025-11-14 17:48:24,779 - INFO - Processing document 8-K_2024-02-07
2025-11-14 17:

Converted 'data\edgar_documents\UNH\8-K_2023-11-28' --> 'data\processed_data\UNH\8-K_2023-11-28.md'
Converted 'data\edgar_documents\UNH\8-K_2023-12-29' --> 'data\processed_data\UNH\8-K_2023-12-29.md'
Converted 'data\edgar_documents\UNH\8-K_2024-01-12' --> 'data\processed_data\UNH\8-K_2024-01-12.md'
Converted 'data\edgar_documents\UNH\8-K_2024-02-07' --> 'data\processed_data\UNH\8-K_2024-02-07.md'


2025-11-14 17:48:24,846 - INFO - Going to convert document batch...
2025-11-14 17:48:24,847 - INFO - Processing document 8-K_2024-02-09
2025-11-14 17:48:24,862 - INFO - Finished converting document 8-K_2024-02-09 in 0.06 sec.
2025-11-14 17:48:24,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,913 - INFO - Going to convert document batch...
2025-11-14 17:48:24,914 - INFO - Processing document 8-K_2024-02-22
2025-11-14 17:48:24,931 - INFO - Finished converting document 8-K_2024-02-22 in 0.06 sec.
2025-11-14 17:48:24,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:24,964 - INFO - Going to convert document batch...
2025-11-14 17:48:24,964 - INFO - Processing document 8-K_2024-03-08
2025-11-14 17:48:24,981 - INFO - Finished converting document 8-K_2024-03-08 in 0.05 sec.
2025-11-14 17:48:25,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,011 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UNH\8-K_2024-02-09' --> 'data\processed_data\UNH\8-K_2024-02-09.md'
Converted 'data\edgar_documents\UNH\8-K_2024-02-22' --> 'data\processed_data\UNH\8-K_2024-02-22.md'
Converted 'data\edgar_documents\UNH\8-K_2024-03-08' --> 'data\processed_data\UNH\8-K_2024-03-08.md'


2025-11-14 17:48:25,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,066 - INFO - Going to convert document batch...
2025-11-14 17:48:25,066 - INFO - Processing document 8-K_2024-03-28
2025-11-14 17:48:25,082 - INFO - Finished converting document 8-K_2024-03-28 in 0.03 sec.
2025-11-14 17:48:25,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,110 - INFO - Going to convert document batch...
2025-11-14 17:48:25,111 - INFO - Processing document 8-K_2024-04-16
2025-11-14 17:48:25,129 - INFO - Finished converting document 8-K_2024-04-16 in 0.03 sec.
2025-11-14 17:48:25,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,160 - INFO - Going to convert document batch...
2025-11-14 17:48:25,161 - INFO - Processing document 8-K_2024-04-17
2025-11-14 17:48:25,176 - INFO - Finished converting document 8-K_2024-04-17 in 0.03 sec.
2025-11-14 17:48:25,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\UNH\8-K_2024-03-21' --> 'data\processed_data\UNH\8-K_2024-03-21.md'
Converted 'data\edgar_documents\UNH\8-K_2024-03-28' --> 'data\processed_data\UNH\8-K_2024-03-28.md'
Converted 'data\edgar_documents\UNH\8-K_2024-04-16' --> 'data\processed_data\UNH\8-K_2024-04-16.md'
Converted 'data\edgar_documents\UNH\8-K_2024-04-17' --> 'data\processed_data\UNH\8-K_2024-04-17.md'


2025-11-14 17:48:25,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,248 - INFO - Going to convert document batch...
2025-11-14 17:48:25,249 - INFO - Processing document 8-K_2024-05-09
2025-11-14 17:48:25,264 - INFO - Finished converting document 8-K_2024-05-09 in 0.03 sec.
2025-11-14 17:48:25,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,297 - INFO - Going to convert document batch...
2025-11-14 17:48:25,298 - INFO - Processing document 8-K_2024-05-15
2025-11-14 17:48:25,311 - INFO - Finished converting document 8-K_2024-05-15 in 0.05 sec.
2025-11-14 17:48:25,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,354 - INFO - Going to convert document batch...
2025-11-14 17:48:25,355 - INFO - Processing document 8-K_2024-05-24
2025-11-14 17:48:25,371 - INFO - Finished converting document 8-K_2024-05-24 in 0.06 sec.
2025-11-14 17:48:25,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\UNH\8-K_2024-04-24' --> 'data\processed_data\UNH\8-K_2024-04-24.md'
Converted 'data\edgar_documents\UNH\8-K_2024-05-09' --> 'data\processed_data\UNH\8-K_2024-05-09.md'
Converted 'data\edgar_documents\UNH\8-K_2024-05-15' --> 'data\processed_data\UNH\8-K_2024-05-15.md'
Converted 'data\edgar_documents\UNH\8-K_2024-05-24' --> 'data\processed_data\UNH\8-K_2024-05-24.md'


2025-11-14 17:48:25,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,460 - INFO - Going to convert document batch...
2025-11-14 17:48:25,461 - INFO - Processing document 8-K_2024-07-16
2025-11-14 17:48:25,478 - INFO - Finished converting document 8-K_2024-07-16 in 0.03 sec.
2025-11-14 17:48:25,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,516 - INFO - Going to convert document batch...
2025-11-14 17:48:25,517 - INFO - Processing document 8-K_2024-07-25
2025-11-14 17:48:25,546 - INFO - Finished converting document 8-K_2024-07-25 in 0.06 sec.
2025-11-14 17:48:25,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,589 - INFO - Going to convert document batch...
2025-11-14 17:48:25,590 - INFO - Processing document 8-K_2024-10-15
2025-11-14 17:48:25,609 - INFO - Finished converting document 8-K_2024-10-15 in 0.05 sec.
2025-11-14 17:48:25,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\8-K_2024-06-07' --> 'data\processed_data\UNH\8-K_2024-06-07.md'
Converted 'data\edgar_documents\UNH\8-K_2024-07-16' --> 'data\processed_data\UNH\8-K_2024-07-16.md'
Converted 'data\edgar_documents\UNH\8-K_2024-07-25' --> 'data\processed_data\UNH\8-K_2024-07-25.md'
Converted 'data\edgar_documents\UNH\8-K_2024-10-15' --> 'data\processed_data\UNH\8-K_2024-10-15.md'


2025-11-14 17:48:25,639 - INFO - Going to convert document batch...
2025-11-14 17:48:25,640 - INFO - Processing document 8-K_2024-11-26
2025-11-14 17:48:25,658 - INFO - Finished converting document 8-K_2024-11-26 in 0.05 sec.
2025-11-14 17:48:25,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,691 - INFO - Going to convert document batch...
2025-11-14 17:48:25,692 - INFO - Processing document 8-K_2024-12-03
2025-11-14 17:48:25,710 - INFO - Finished converting document 8-K_2024-12-03 in 0.03 sec.
2025-11-14 17:48:25,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,746 - INFO - Going to convert document batch...
2025-11-14 17:48:25,748 - INFO - Processing document 8-K_2024-12-04
2025-11-14 17:48:25,764 - INFO - Finished converting document 8-K_2024-12-04 in 0.05 sec.
2025-11-14 17:48:25,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:25,819 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UNH\8-K_2024-11-26' --> 'data\processed_data\UNH\8-K_2024-11-26.md'
Converted 'data\edgar_documents\UNH\8-K_2024-12-03' --> 'data\processed_data\UNH\8-K_2024-12-03.md'
Converted 'data\edgar_documents\UNH\8-K_2024-12-04' --> 'data\processed_data\UNH\8-K_2024-12-04.md'
Converted 'data\edgar_documents\UNH\8-K_2025-01-16' --> 'data\processed_data\UNH\8-K_2025-01-16.md'


2025-11-14 17:48:26,087 - INFO - Going to convert document batch...
2025-11-14 17:48:26,088 - INFO - Processing document 8-K_2025-04-17
2025-11-14 17:48:26,104 - INFO - Finished converting document 8-K_2025-04-17 in 0.26 sec.
2025-11-14 17:48:26,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,139 - INFO - Going to convert document batch...
2025-11-14 17:48:26,141 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:48:26,179 - INFO - Finished converting document 8-K_2025-04-29 in 0.06 sec.
2025-11-14 17:48:26,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,231 - INFO - Going to convert document batch...
2025-11-14 17:48:26,233 - INFO - Processing document 8-K_2025-05-14
2025-11-14 17:48:26,269 - INFO - Finished converting document 8-K_2025-05-14 in 0.08 sec.
2025-11-14 17:48:26,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNH\8-K_2025-04-17' --> 'data\processed_data\UNH\8-K_2025-04-17.md'
Converted 'data\edgar_documents\UNH\8-K_2025-04-29' --> 'data\processed_data\UNH\8-K_2025-04-29.md'
Converted 'data\edgar_documents\UNH\8-K_2025-05-14' --> 'data\processed_data\UNH\8-K_2025-05-14.md'


2025-11-14 17:48:26,307 - INFO - Going to convert document batch...
2025-11-14 17:48:26,308 - INFO - Processing document 8-K_2025-05-21
2025-11-14 17:48:26,324 - INFO - Finished converting document 8-K_2025-05-21 in 0.05 sec.
2025-11-14 17:48:26,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,361 - INFO - Going to convert document batch...
2025-11-14 17:48:26,362 - INFO - Processing document 8-K_2025-06-04
2025-11-14 17:48:26,388 - INFO - Finished converting document 8-K_2025-06-04 in 0.06 sec.
2025-11-14 17:48:26,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,428 - INFO - Going to convert document batch...
2025-11-14 17:48:26,428 - INFO - Processing document 8-K_2025-06-20
2025-11-14 17:48:26,448 - INFO - Finished converting document 8-K_2025-06-20 in 0.05 sec.
2025-11-14 17:48:26,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,488 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UNH\8-K_2025-05-21' --> 'data\processed_data\UNH\8-K_2025-05-21.md'
Converted 'data\edgar_documents\UNH\8-K_2025-06-04' --> 'data\processed_data\UNH\8-K_2025-06-04.md'
Converted 'data\edgar_documents\UNH\8-K_2025-06-20' --> 'data\processed_data\UNH\8-K_2025-06-20.md'


2025-11-14 17:48:26,520 - INFO - Finished converting document 8-K_2025-07-24 in 0.06 sec.
2025-11-14 17:48:26,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,555 - INFO - Going to convert document batch...
2025-11-14 17:48:26,556 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:48:26,574 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 17:48:26,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,611 - INFO - Going to convert document batch...
2025-11-14 17:48:26,611 - INFO - Processing document 8-K_2025-07-31
2025-11-14 17:48:26,635 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 17:48:26,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,667 - INFO - Going to convert document batch...
2025-11-14 17:48:26,668 - INFO - Processing document 8-K_2025-08-20
2025-11-14 17:48:26,683 - INFO - Finished converting document 8-K_2025-08-20 in 0.

Converted 'data\edgar_documents\UNH\8-K_2025-07-24' --> 'data\processed_data\UNH\8-K_2025-07-24.md'
Converted 'data\edgar_documents\UNH\8-K_2025-07-29' --> 'data\processed_data\UNH\8-K_2025-07-29.md'
Converted 'data\edgar_documents\UNH\8-K_2025-07-31' --> 'data\processed_data\UNH\8-K_2025-07-31.md'
Converted 'data\edgar_documents\UNH\8-K_2025-08-20' --> 'data\processed_data\UNH\8-K_2025-08-20.md'


2025-11-14 17:48:26,746 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,756 - INFO - Going to convert document batch...
2025-11-14 17:48:26,757 - INFO - Processing document 8-K_2025-09-09
2025-11-14 17:48:26,775 - INFO - Finished converting document 8-K_2025-09-09 in 0.03 sec.
2025-11-14 17:48:26,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,806 - INFO - Going to convert document batch...
2025-11-14 17:48:26,807 - INFO - Processing document 8-K_2025-10-28
2025-11-14 17:48:26,826 - INFO - Finished converting document 8-K_2025-10-28 in 0.05 sec.
2025-11-14 17:48:26,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:48:26,860 - INFO - Going to convert document batch...
2025-11-14 17:48:26,861 - INFO - Processing document 8-K_2025-11-07
2025-11-14 17:48:26,877 - INFO - Finished converting document 8-K_2025-11-07 in 0.05 sec.


Converted 'data\edgar_documents\UNH\8-K_2025-09-08' --> 'data\processed_data\UNH\8-K_2025-09-08.md'
Converted 'data\edgar_documents\UNH\8-K_2025-09-09' --> 'data\processed_data\UNH\8-K_2025-09-09.md'
Converted 'data\edgar_documents\UNH\8-K_2025-10-28' --> 'data\processed_data\UNH\8-K_2025-10-28.md'
Converted 'data\edgar_documents\UNH\8-K_2025-11-07' --> 'data\processed_data\UNH\8-K_2025-11-07.md'


2025-11-14 17:48:26,937 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:26,938 - ERROR - Input document DEF-14A_2023-04-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:48:26,941 - INFO - Going to convert document batch...
2025-11-14 17:48:26,994 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:48:26,995 - ERROR - Input document DEF-14A_2024-04-22 with format No

Error processing data\edgar_documents\UNH\DEF-14A_2023-04-21: File format not allowed: data\edgar_documents\UNH\DEF-14A_2023-04-21
Error processing data\edgar_documents\UNH\DEF-14A_2024-04-22: File format not allowed: data\edgar_documents\UNH\DEF-14A_2024-04-22
Error processing data\edgar_documents\UNH\DEF-14A_2025-04-21: File format not allowed: data\edgar_documents\UNH\DEF-14A_2025-04-21
Processed 131 new files. Errors: 10
Found 160 files to process in data\edgar_documents\UNP


2025-11-14 17:48:27,965 - INFO - Going to convert document batch...
2025-11-14 17:48:27,966 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:48:27,966 - INFO - Processing document 10-K_2023-02-10
2025-11-14 17:48:33,118 - INFO - Finished converting document 10-K_2023-02-10 in 6.05 sec.
2025-11-14 17:48:33,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-K_2023-02-10' --> 'data\processed_data\UNP\10-K_2023-02-10.md'


2025-11-14 17:48:34,742 - INFO - Going to convert document batch...
2025-11-14 17:48:34,743 - INFO - Processing document 10-K_2024-02-09
2025-11-14 17:48:39,675 - INFO - Finished converting document 10-K_2024-02-09 in 5.86 sec.
2025-11-14 17:48:40,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-K_2024-02-09' --> 'data\processed_data\UNP\10-K_2024-02-09.md'


2025-11-14 17:48:41,138 - INFO - Going to convert document batch...
2025-11-14 17:48:41,139 - INFO - Processing document 10-K_2025-02-07
2025-11-14 17:48:41,955 - INFO - Finished converting document 10-K_2025-02-07 in 1.61 sec.
2025-11-14 17:48:42,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-K_2025-02-07' --> 'data\processed_data\UNP\10-K_2025-02-07.md'


2025-11-14 17:48:42,660 - INFO - Going to convert document batch...
2025-11-14 17:48:42,660 - INFO - Processing document 10-Q_2023-04-20
2025-11-14 17:48:44,092 - INFO - Finished converting document 10-Q_2023-04-20 in 1.80 sec.
2025-11-14 17:48:44,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2023-04-20' --> 'data\processed_data\UNP\10-Q_2023-04-20.md'


2025-11-14 17:48:45,276 - INFO - Going to convert document batch...
2025-11-14 17:48:45,277 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 17:48:47,724 - INFO - Finished converting document 10-Q_2023-07-26 in 3.31 sec.
2025-11-14 17:48:48,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2023-07-26' --> 'data\processed_data\UNP\10-Q_2023-07-26.md'


2025-11-14 17:48:48,886 - INFO - Going to convert document batch...
2025-11-14 17:48:48,887 - INFO - Processing document 10-Q_2023-10-19
2025-11-14 17:48:51,345 - INFO - Finished converting document 10-Q_2023-10-19 in 3.16 sec.
2025-11-14 17:48:51,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2023-10-19' --> 'data\processed_data\UNP\10-Q_2023-10-19.md'


2025-11-14 17:48:52,129 - INFO - Going to convert document batch...
2025-11-14 17:48:52,129 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 17:48:53,808 - INFO - Finished converting document 10-Q_2024-04-25 in 2.00 sec.
2025-11-14 17:48:54,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2024-04-25' --> 'data\processed_data\UNP\10-Q_2024-04-25.md'


2025-11-14 17:48:54,563 - INFO - Going to convert document batch...
2025-11-14 17:48:54,564 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:48:56,974 - INFO - Finished converting document 10-Q_2024-07-25 in 2.84 sec.
2025-11-14 17:48:57,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2024-07-25' --> 'data\processed_data\UNP\10-Q_2024-07-25.md'


2025-11-14 17:48:58,240 - INFO - Going to convert document batch...
2025-11-14 17:48:58,240 - INFO - Processing document 10-Q_2024-10-24
2025-11-14 17:49:00,833 - INFO - Finished converting document 10-Q_2024-10-24 in 3.41 sec.
2025-11-14 17:49:01,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2024-10-24' --> 'data\processed_data\UNP\10-Q_2024-10-24.md'


2025-11-14 17:49:01,525 - INFO - Going to convert document batch...
2025-11-14 17:49:01,527 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 17:49:01,976 - INFO - Finished converting document 10-Q_2025-04-24 in 0.67 sec.
2025-11-14 17:49:02,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2025-04-24' --> 'data\processed_data\UNP\10-Q_2025-04-24.md'


2025-11-14 17:49:02,838 - INFO - Going to convert document batch...
2025-11-14 17:49:02,839 - INFO - Processing document 10-Q_2025-07-24
2025-11-14 17:49:03,373 - INFO - Finished converting document 10-Q_2025-07-24 in 1.19 sec.
2025-11-14 17:49:03,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\10-Q_2025-07-24' --> 'data\processed_data\UNP\10-Q_2025-07-24.md'


2025-11-14 17:49:03,905 - INFO - Going to convert document batch...
2025-11-14 17:49:03,905 - INFO - Processing document 10-Q_2025-10-23
2025-11-14 17:49:04,466 - INFO - Finished converting document 10-Q_2025-10-23 in 0.86 sec.
2025-11-14 17:49:04,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:04,757 - INFO - Going to convert document batch...
2025-11-14 17:49:04,757 - INFO - Processing document 4_2023-01-04
2025-11-14 17:49:04,777 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 17:49:04,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:04,843 - INFO - Going to convert document batch...
2025-11-14 17:49:04,844 - INFO - Processing document 4_2023-01-11
2025-11-14 17:49:04,864 - INFO - Finished converting document 4_2023-01-11 in 0.06 sec.
2025-11-14 17:49:04,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:04,907 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UNP\10-Q_2025-10-23' --> 'data\processed_data\UNP\10-Q_2025-10-23.md'
Converted 'data\edgar_documents\UNP\4_2023-01-04' --> 'data\processed_data\UNP\4_2023-01-04.md'
Converted 'data\edgar_documents\UNP\4_2023-01-11' --> 'data\processed_data\UNP\4_2023-01-11.md'


2025-11-14 17:49:04,907 - INFO - Processing document 4_2023-02-13
2025-11-14 17:49:04,935 - INFO - Finished converting document 4_2023-02-13 in 0.06 sec.
2025-11-14 17:49:04,977 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:04,978 - ERROR - Input document 4_2023-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:04,979 - INFO - Going to convert document batch...
2025-11-14 17:49:04,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49

Converted 'data\edgar_documents\UNP\4_2023-02-13' --> 'data\processed_data\UNP\4_2023-02-13.md'
Error processing data\edgar_documents\UNP\4_2023-02-15: File format not allowed: data\edgar_documents\UNP\4_2023-02-15
Converted 'data\edgar_documents\UNP\4_2023-03-01' --> 'data\processed_data\UNP\4_2023-03-01.md'
Converted 'data\edgar_documents\UNP\4_2023-03-14' --> 'data\processed_data\UNP\4_2023-03-14.md'


2025-11-14 17:49:05,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:05,181 - INFO - Going to convert document batch...
2025-11-14 17:49:05,181 - INFO - Processing document 4_2023-04-11
2025-11-14 17:49:05,203 - INFO - Finished converting document 4_2023-04-11 in 0.05 sec.
2025-11-14 17:49:05,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:05,261 - INFO - Going to convert document batch...
2025-11-14 17:49:05,263 - INFO - Processing document 4_2023-05-12
2025-11-14 17:49:05,302 - INFO - Finished converting document 4_2023-05-12 in 0.08 sec.
2025-11-14 17:49:05,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\4_2023-04-04' --> 'data\processed_data\UNP\4_2023-04-04.md'
Converted 'data\edgar_documents\UNP\4_2023-04-11' --> 'data\processed_data\UNP\4_2023-04-11.md'
Converted 'data\edgar_documents\UNP\4_2023-05-12' --> 'data\processed_data\UNP\4_2023-05-12.md'


2025-11-14 17:49:05,353 - INFO - Going to convert document batch...
2025-11-14 17:49:05,354 - INFO - Processing document 4_2023-06-13
2025-11-14 17:49:05,375 - INFO - Finished converting document 4_2023-06-13 in 0.05 sec.
2025-11-14 17:49:05,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:05,424 - INFO - Going to convert document batch...
2025-11-14 17:49:05,424 - INFO - Processing document 4_2023-07-05
2025-11-14 17:49:05,446 - INFO - Finished converting document 4_2023-07-05 in 0.03 sec.
2025-11-14 17:49:05,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:05,492 - INFO - Going to convert document batch...
2025-11-14 17:49:05,493 - INFO - Processing document 4_2023-07-12
2025-11-14 17:49:05,514 - INFO - Finished converting document 4_2023-07-12 in 0.05 sec.
2025-11-14 17:49:05,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:05,580 - INFO - Going to convert document batch...
2025-11-14 17:49:05,580 - 

Converted 'data\edgar_documents\UNP\4_2023-06-13' --> 'data\processed_data\UNP\4_2023-06-13.md'
Converted 'data\edgar_documents\UNP\4_2023-07-05' --> 'data\processed_data\UNP\4_2023-07-05.md'
Converted 'data\edgar_documents\UNP\4_2023-07-12' --> 'data\processed_data\UNP\4_2023-07-12.md'


2025-11-14 17:49:05,600 - INFO - Finished converting document 4_2023-08-14 in 0.06 sec.
2025-11-14 17:49:05,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\4_2023-08-14' --> 'data\processed_data\UNP\4_2023-08-14.md'


2025-11-14 17:49:05,935 - INFO - Going to convert document batch...
2025-11-14 17:49:05,936 - INFO - Processing document 4_2023-08-24
2025-11-14 17:49:05,962 - INFO - Finished converting document 4_2023-08-24 in 0.33 sec.
2025-11-14 17:49:06,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,008 - INFO - Going to convert document batch...
2025-11-14 17:49:06,008 - INFO - Processing document 4_2023-08-25
2025-11-14 17:49:06,026 - INFO - Finished converting document 4_2023-08-25 in 0.05 sec.
2025-11-14 17:49:06,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,091 - INFO - Going to convert document batch...
2025-11-14 17:49:06,093 - INFO - Processing document 4_2023-09-11
2025-11-14 17:49:06,114 - INFO - Finished converting document 4_2023-09-11 in 0.06 sec.
2025-11-14 17:49:06,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,152 - INFO - Going to convert document batch...
2025-11-14 17:49:06,153 - 

Converted 'data\edgar_documents\UNP\4_2023-08-24' --> 'data\processed_data\UNP\4_2023-08-24.md'
Converted 'data\edgar_documents\UNP\4_2023-08-25' --> 'data\processed_data\UNP\4_2023-08-25.md'
Converted 'data\edgar_documents\UNP\4_2023-09-11' --> 'data\processed_data\UNP\4_2023-09-11.md'


2025-11-14 17:49:06,172 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.
2025-11-14 17:49:06,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,210 - INFO - Going to convert document batch...
2025-11-14 17:49:06,211 - INFO - Processing document 4_2023-10-31
2025-11-14 17:49:06,229 - INFO - Finished converting document 4_2023-10-31 in 0.05 sec.
2025-11-14 17:49:06,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,271 - INFO - Going to convert document batch...
2025-11-14 17:49:06,272 - INFO - Processing document 4_2023-11-14
2025-11-14 17:49:06,290 - INFO - Finished converting document 4_2023-11-14 in 0.03 sec.
2025-11-14 17:49:06,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,326 - INFO - Going to convert document batch...
2025-11-14 17:49:06,327 - INFO - Processing document 4_2023-11-21
2025-11-14 17:49:06,345 - INFO - Finished converting document 4_2023-11-21 in 0.03 sec.
2025-1

Converted 'data\edgar_documents\UNP\4_2023-10-03' --> 'data\processed_data\UNP\4_2023-10-03.md'
Converted 'data\edgar_documents\UNP\4_2023-10-31' --> 'data\processed_data\UNP\4_2023-10-31.md'
Converted 'data\edgar_documents\UNP\4_2023-11-14' --> 'data\processed_data\UNP\4_2023-11-14.md'
Converted 'data\edgar_documents\UNP\4_2023-11-21' --> 'data\processed_data\UNP\4_2023-11-21.md'


2025-11-14 17:49:06,384 - INFO - Going to convert document batch...
2025-11-14 17:49:06,385 - INFO - Processing document 4_2023-12-11
2025-11-14 17:49:06,405 - INFO - Finished converting document 4_2023-12-11 in 0.05 sec.
2025-11-14 17:49:06,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,448 - INFO - Going to convert document batch...
2025-11-14 17:49:06,449 - INFO - Processing document 4_2023-12-14
2025-11-14 17:49:06,467 - INFO - Finished converting document 4_2023-12-14 in 0.05 sec.
2025-11-14 17:49:06,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,521 - INFO - Going to convert document batch...
2025-11-14 17:49:06,521 - INFO - Processing document 4_2024-01-03
2025-11-14 17:49:06,541 - INFO - Finished converting document 4_2024-01-03 in 0.06 sec.
2025-11-14 17:49:06,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,580 - INFO - Going to convert document batch...
2025-11-14 17:49:06,581 - 

Converted 'data\edgar_documents\UNP\4_2023-12-11' --> 'data\processed_data\UNP\4_2023-12-11.md'
Converted 'data\edgar_documents\UNP\4_2023-12-14' --> 'data\processed_data\UNP\4_2023-12-14.md'
Converted 'data\edgar_documents\UNP\4_2024-01-03' --> 'data\processed_data\UNP\4_2024-01-03.md'


2025-11-14 17:49:06,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,642 - INFO - Going to convert document batch...
2025-11-14 17:49:06,644 - INFO - Processing document 4_2024-02-06
2025-11-14 17:49:06,665 - INFO - Finished converting document 4_2024-02-06 in 0.03 sec.
2025-11-14 17:49:06,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,730 - INFO - Going to convert document batch...
2025-11-14 17:49:06,732 - INFO - Processing document 4_2024-02-12
2025-11-14 17:49:06,780 - INFO - Finished converting document 4_2024-02-12 in 0.09 sec.


Converted 'data\edgar_documents\UNP\4_2024-01-11' --> 'data\processed_data\UNP\4_2024-01-11.md'
Converted 'data\edgar_documents\UNP\4_2024-02-06' --> 'data\processed_data\UNP\4_2024-02-06.md'
Converted 'data\edgar_documents\UNP\4_2024-02-12' --> 'data\processed_data\UNP\4_2024-02-12.md'


2025-11-14 17:49:06,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,846 - INFO - Going to convert document batch...
2025-11-14 17:49:06,847 - INFO - Processing document 4_2024-02-16
2025-11-14 17:49:06,874 - INFO - Finished converting document 4_2024-02-16 in 0.06 sec.
2025-11-14 17:49:06,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,924 - INFO - Going to convert document batch...
2025-11-14 17:49:06,925 - INFO - Processing document 4_2024-02-28
2025-11-14 17:49:06,946 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 17:49:06,977 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:06,984 - INFO - Going to convert document batch...
2025-11-14 17:49:06,985 - INFO - Processing document 4_2024-03-11
2025-11-14 17:49:07,002 - INFO - Finished converting document 4_2024-03-11 in 0.03 sec.
2025-11-14 17:49:07,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\UNP\4_2024-02-16' --> 'data\processed_data\UNP\4_2024-02-16.md'
Converted 'data\edgar_documents\UNP\4_2024-02-28' --> 'data\processed_data\UNP\4_2024-02-28.md'
Converted 'data\edgar_documents\UNP\4_2024-03-11' --> 'data\processed_data\UNP\4_2024-03-11.md'
Converted 'data\edgar_documents\UNP\4_2024-04-02' --> 'data\processed_data\UNP\4_2024-04-02.md'


2025-11-14 17:49:07,097 - INFO - Going to convert document batch...
2025-11-14 17:49:07,098 - INFO - Processing document 4_2024-04-11
2025-11-14 17:49:07,116 - INFO - Finished converting document 4_2024-04-11 in 0.03 sec.
2025-11-14 17:49:07,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,168 - INFO - Going to convert document batch...
2025-11-14 17:49:07,169 - INFO - Processing document 4_2024-05-13
2025-11-14 17:49:07,207 - INFO - Finished converting document 4_2024-05-13 in 0.06 sec.
2025-11-14 17:49:07,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,256 - INFO - Going to convert document batch...
2025-11-14 17:49:07,257 - INFO - Processing document 4_2024-06-12
2025-11-14 17:49:07,277 - INFO - Finished converting document 4_2024-06-12 in 0.05 sec.
2025-11-14 17:49:07,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\4_2024-04-11' --> 'data\processed_data\UNP\4_2024-04-11.md'
Converted 'data\edgar_documents\UNP\4_2024-05-13' --> 'data\processed_data\UNP\4_2024-05-13.md'
Converted 'data\edgar_documents\UNP\4_2024-06-12' --> 'data\processed_data\UNP\4_2024-06-12.md'


2025-11-14 17:49:07,337 - INFO - Going to convert document batch...
2025-11-14 17:49:07,338 - INFO - Processing document 4_2024-07-02
2025-11-14 17:49:07,357 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 17:49:07,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,399 - INFO - Going to convert document batch...
2025-11-14 17:49:07,400 - INFO - Processing document 4_2024-07-10
2025-11-14 17:49:07,421 - INFO - Finished converting document 4_2024-07-10 in 0.05 sec.
2025-11-14 17:49:07,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,472 - INFO - Going to convert document batch...
2025-11-14 17:49:07,474 - INFO - Processing document 4_2024-08-01
2025-11-14 17:49:07,494 - INFO - Finished converting document 4_2024-08-01 in 0.05 sec.
2025-11-14 17:49:07,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,533 - INFO - Going to convert document batch...
2025-11-14 17:49:07,534 - 

Converted 'data\edgar_documents\UNP\4_2024-07-02' --> 'data\processed_data\UNP\4_2024-07-02.md'
Converted 'data\edgar_documents\UNP\4_2024-07-10' --> 'data\processed_data\UNP\4_2024-07-10.md'
Converted 'data\edgar_documents\UNP\4_2024-08-01' --> 'data\processed_data\UNP\4_2024-08-01.md'
Converted 'data\edgar_documents\UNP\4_2024-08-12' --> 'data\processed_data\UNP\4_2024-08-12.md'


2025-11-14 17:49:07,592 - INFO - Going to convert document batch...
2025-11-14 17:49:07,594 - INFO - Processing document 4_2024-09-11
2025-11-14 17:49:07,613 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.
2025-11-14 17:49:07,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,655 - INFO - Going to convert document batch...
2025-11-14 17:49:07,656 - INFO - Processing document 4_2024-10-03
2025-11-14 17:49:07,674 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 17:49:07,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,712 - INFO - Going to convert document batch...
2025-11-14 17:49:07,713 - INFO - Processing document 4_2024-10-11
2025-11-14 17:49:07,733 - INFO - Finished converting document 4_2024-10-11 in 0.05 sec.
2025-11-14 17:49:07,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,789 - INFO - Going to convert document batch...
2025-11-14 17:49:07,789 - 

Converted 'data\edgar_documents\UNP\4_2024-09-11' --> 'data\processed_data\UNP\4_2024-09-11.md'
Converted 'data\edgar_documents\UNP\4_2024-10-03' --> 'data\processed_data\UNP\4_2024-10-03.md'
Converted 'data\edgar_documents\UNP\4_2024-10-11' --> 'data\processed_data\UNP\4_2024-10-11.md'


2025-11-14 17:49:07,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,845 - INFO - Going to convert document batch...
2025-11-14 17:49:07,846 - INFO - Processing document 4_2024-11-07
2025-11-14 17:49:07,866 - INFO - Finished converting document 4_2024-11-07 in 0.03 sec.
2025-11-14 17:49:07,901 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,912 - INFO - Going to convert document batch...
2025-11-14 17:49:07,913 - INFO - Processing document 4_2024-11-12
2025-11-14 17:49:07,941 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:49:07,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:07,992 - INFO - Going to convert document batch...
2025-11-14 17:49:07,993 - INFO - Processing document 4_2024-12-04


Converted 'data\edgar_documents\UNP\4_2024-11-05' --> 'data\processed_data\UNP\4_2024-11-05.md'
Converted 'data\edgar_documents\UNP\4_2024-11-07' --> 'data\processed_data\UNP\4_2024-11-07.md'
Converted 'data\edgar_documents\UNP\4_2024-11-12' --> 'data\processed_data\UNP\4_2024-11-12.md'


2025-11-14 17:49:08,017 - INFO - Finished converting document 4_2024-12-04 in 0.05 sec.
2025-11-14 17:49:08,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,063 - INFO - Going to convert document batch...
2025-11-14 17:49:08,064 - INFO - Processing document 4_2024-12-12
2025-11-14 17:49:08,085 - INFO - Finished converting document 4_2024-12-12 in 0.03 sec.
2025-11-14 17:49:08,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,147 - INFO - Going to convert document batch...
2025-11-14 17:49:08,149 - INFO - Processing document 4_2024-12-13
2025-11-14 17:49:08,172 - INFO - Finished converting document 4_2024-12-13 in 0.06 sec.
2025-11-14 17:49:08,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,216 - INFO - Going to convert document batch...
2025-11-14 17:49:08,217 - INFO - Processing document 4_2025-01-03
2025-11-14 17:49:08,237 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.


Converted 'data\edgar_documents\UNP\4_2024-12-04' --> 'data\processed_data\UNP\4_2024-12-04.md'
Converted 'data\edgar_documents\UNP\4_2024-12-12' --> 'data\processed_data\UNP\4_2024-12-12.md'
Converted 'data\edgar_documents\UNP\4_2024-12-13' --> 'data\processed_data\UNP\4_2024-12-13.md'


2025-11-14 17:49:08,270 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,279 - INFO - Going to convert document batch...
2025-11-14 17:49:08,280 - INFO - Processing document 4_2025-01-08
2025-11-14 17:49:08,302 - INFO - Finished converting document 4_2025-01-08 in 0.05 sec.
2025-11-14 17:49:08,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,349 - INFO - Going to convert document batch...
2025-11-14 17:49:08,350 - INFO - Processing document 4_2025-01-13
2025-11-14 17:49:08,375 - INFO - Finished converting document 4_2025-01-13 in 0.05 sec.
2025-11-14 17:49:08,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,425 - INFO - Going to convert document batch...
2025-11-14 17:49:08,426 - INFO - Processing document 4_2025-01-28


Converted 'data\edgar_documents\UNP\4_2025-01-03' --> 'data\processed_data\UNP\4_2025-01-03.md'
Converted 'data\edgar_documents\UNP\4_2025-01-08' --> 'data\processed_data\UNP\4_2025-01-08.md'
Converted 'data\edgar_documents\UNP\4_2025-01-13' --> 'data\processed_data\UNP\4_2025-01-13.md'


2025-11-14 17:49:08,453 - INFO - Finished converting document 4_2025-01-28 in 0.06 sec.
2025-11-14 17:49:08,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,502 - INFO - Going to convert document batch...
2025-11-14 17:49:08,502 - INFO - Processing document 4_2025-01-29
2025-11-14 17:49:08,526 - INFO - Finished converting document 4_2025-01-29 in 0.05 sec.
2025-11-14 17:49:08,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,590 - INFO - Going to convert document batch...
2025-11-14 17:49:08,590 - INFO - Processing document 4_2025-02-06
2025-11-14 17:49:08,616 - INFO - Finished converting document 4_2025-02-06 in 0.06 sec.
2025-11-14 17:49:08,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,661 - INFO - Going to convert document batch...
2025-11-14 17:49:08,662 - INFO - Processing document 4_2025-02-07
2025-11-14 17:49:08,683 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.


Converted 'data\edgar_documents\UNP\4_2025-01-28' --> 'data\processed_data\UNP\4_2025-01-28.md'
Converted 'data\edgar_documents\UNP\4_2025-01-29' --> 'data\processed_data\UNP\4_2025-01-29.md'
Converted 'data\edgar_documents\UNP\4_2025-02-06' --> 'data\processed_data\UNP\4_2025-02-06.md'


2025-11-14 17:49:08,722 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:08,723 - ERROR - Input document 4_2025-02-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:08,724 - INFO - Going to convert document batch...
2025-11-14 17:49:08,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,746 - INFO - Going to convert document batch...
2025-11-14 17:49:08,747 - INFO - Processing document 4_2025-02-11
2025-11-14 17:49:08,771 - INFO - Fin

Converted 'data\edgar_documents\UNP\4_2025-02-07' --> 'data\processed_data\UNP\4_2025-02-07.md'
Error processing data\edgar_documents\UNP\4_2025-02-10: File format not allowed: data\edgar_documents\UNP\4_2025-02-10
Converted 'data\edgar_documents\UNP\4_2025-02-11' --> 'data\processed_data\UNP\4_2025-02-11.md'
Error processing data\edgar_documents\UNP\4_2025-02-12: File format not allowed: data\edgar_documents\UNP\4_2025-02-12


2025-11-14 17:49:08,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:08,964 - INFO - Going to convert document batch...
2025-11-14 17:49:08,965 - INFO - Processing document 4_2025-04-02
2025-11-14 17:49:08,997 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 17:49:09,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,047 - INFO - Going to convert document batch...
2025-11-14 17:49:09,048 - INFO - Processing document 4_2025-04-11
2025-11-14 17:49:09,069 - INFO - Finished converting document 4_2025-04-11 in 0.03 sec.
2025-11-14 17:49:09,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,115 - INFO - Going to convert document batch...
2025-11-14 17:49:09,115 - INFO - Processing document 4_2025-04-29
2025-11-14 17:49:09,137 - INFO - Finished converting document 4_2025-04-29 in 0.05 sec.


Converted 'data\edgar_documents\UNP\4_2025-03-11' --> 'data\processed_data\UNP\4_2025-03-11.md'
Converted 'data\edgar_documents\UNP\4_2025-04-02' --> 'data\processed_data\UNP\4_2025-04-02.md'
Converted 'data\edgar_documents\UNP\4_2025-04-11' --> 'data\processed_data\UNP\4_2025-04-11.md'


2025-11-14 17:49:09,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,178 - INFO - Going to convert document batch...
2025-11-14 17:49:09,179 - INFO - Processing document 4_2025-05-12
2025-11-14 17:49:09,200 - INFO - Finished converting document 4_2025-05-12 in 0.05 sec.
2025-11-14 17:49:09,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,242 - INFO - Going to convert document batch...
2025-11-14 17:49:09,242 - INFO - Processing document 4_2025-06-11
2025-11-14 17:49:09,263 - INFO - Finished converting document 4_2025-06-11 in 0.05 sec.
2025-11-14 17:49:09,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,302 - INFO - Going to convert document batch...
2025-11-14 17:49:09,303 - INFO - Processing document 4_2025-07-02
2025-11-14 17:49:09,322 - INFO - Finished converting document 4_2025-07-02 in 0.03 sec.
2025-11-14 17:49:09,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\4_2025-04-29' --> 'data\processed_data\UNP\4_2025-04-29.md'
Converted 'data\edgar_documents\UNP\4_2025-05-12' --> 'data\processed_data\UNP\4_2025-05-12.md'
Converted 'data\edgar_documents\UNP\4_2025-06-11' --> 'data\processed_data\UNP\4_2025-06-11.md'
Converted 'data\edgar_documents\UNP\4_2025-07-02' --> 'data\processed_data\UNP\4_2025-07-02.md'


2025-11-14 17:49:09,362 - INFO - Going to convert document batch...
2025-11-14 17:49:09,363 - INFO - Processing document 4_2025-07-03
2025-11-14 17:49:09,383 - INFO - Finished converting document 4_2025-07-03 in 0.03 sec.
2025-11-14 17:49:09,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:09,438 - INFO - Going to convert document batch...
2025-11-14 17:49:09,439 - INFO - Processing document 4_2025-07-11
2025-11-14 17:49:09,473 - INFO - Finished converting document 4_2025-07-11 in 0.06 sec.
2025-11-14 17:49:09,507 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:09,507 - ERROR - Input document 4_2025-07-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\UNP\4_2025-07-03' --> 'data\processed_data\UNP\4_2025-07-03.md'
Converted 'data\edgar_documents\UNP\4_2025-07-11' --> 'data\processed_data\UNP\4_2025-07-11.md'
Error processing data\edgar_documents\UNP\4_2025-07-29: File format not allowed: data\edgar_documents\UNP\4_2025-07-29
Error processing data\edgar_documents\UNP\4_2025-07-30: File format not allowed: data\edgar_documents\UNP\4_2025-07-30
Error processing data\edgar_documents\UNP\4_2025-07-31: File format not allowed: data\edgar_documents\UNP\4_2025-07-31
Error processing data\edgar_documents\UNP\4_2025-08-04: File format not allowed: data\edgar_documents\UNP\4_2025-08-04
Error processing data\edgar_documents\UNP\4_2025-08-05: File format not allowed: data\edgar_documents\UNP\4_2025-08-05
Error processing data\edgar_documents\UNP\4_2025-08-06: File format not allowed: data\edgar_documents\UNP\4_2025-08-06


2025-11-14 17:49:09,598 - ERROR - Input document 4_2025-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:09,599 - INFO - Going to convert document batch...
2025-11-14 17:49:09,613 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:09,614 - ERROR - Input document 4_2025-08-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\UNP\4_2025-08-07: File format not allowed: data\edgar_documents\UNP\4_2025-08-07
Error processing data\edgar_documents\UNP\4_2025-08-11: File format not allowed: data\edgar_documents\UNP\4_2025-08-11
Error processing data\edgar_documents\UNP\4_2025-08-12: File format not allowed: data\edgar_documents\UNP\4_2025-08-12
Error processing data\edgar_documents\UNP\4_2025-08-13: File format not allowed: data\edgar_documents\UNP\4_2025-08-13
Error processing data\edgar_documents\UNP\4_2025-08-14: File format not allowed: data\edgar_documents\UNP\4_2025-08-14
Error processing data\edgar_documents\UNP\4_2025-08-18: File format not allowed: data\edgar_documents\UNP\4_2025-08-18
Error processing data\edgar_documents\UNP\4_2025-08-19: File format not allowed: data\edgar_documents\UNP\4_2025-08-19
Error processing data\edgar_documents\UNP\4_2025-08-20: File format not allowed: data\edgar_documents\UNP\4_2025-08-20
Error processing data\edgar_documents\UNP\4_2025

2025-11-14 17:49:09,779 - ERROR - Input document 4_2025-08-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:09,781 - INFO - Going to convert document batch...
2025-11-14 17:49:09,795 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:09,796 - ERROR - Input document 4_2025-08-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\UNP\4_2025-08-25: File format not allowed: data\edgar_documents\UNP\4_2025-08-25
Error processing data\edgar_documents\UNP\4_2025-08-26: File format not allowed: data\edgar_documents\UNP\4_2025-08-26
Error processing data\edgar_documents\UNP\4_2025-08-27: File format not allowed: data\edgar_documents\UNP\4_2025-08-27
Error processing data\edgar_documents\UNP\4_2025-08-28: File format not allowed: data\edgar_documents\UNP\4_2025-08-28
Error processing data\edgar_documents\UNP\4_2025-09-03: File format not allowed: data\edgar_documents\UNP\4_2025-09-03
Error processing data\edgar_documents\UNP\4_2025-09-05: File format not allowed: data\edgar_documents\UNP\4_2025-09-05
Error processing data\edgar_documents\UNP\4_2025-09-10: File format not allowed: data\edgar_documents\UNP\4_2025-09-10
Converted 'data\edgar_documents\UNP\4_2025-09-11' --> 'data\processed_data\UNP\4_2025-09-11.md'
Error processing data\edgar_documents\UNP\4_2025-09-12: File format not

2025-11-14 17:49:09,968 - ERROR - Input document 4_2025-09-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:09,969 - INFO - Going to convert document batch...
2025-11-14 17:49:09,981 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:09,982 - ERROR - Input document 4_2025-09-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\UNP\4_2025-09-16: File format not allowed: data\edgar_documents\UNP\4_2025-09-16
Error processing data\edgar_documents\UNP\4_2025-09-17: File format not allowed: data\edgar_documents\UNP\4_2025-09-17
Error processing data\edgar_documents\UNP\4_2025-09-19: File format not allowed: data\edgar_documents\UNP\4_2025-09-19
Error processing data\edgar_documents\UNP\4_2025-09-22: File format not allowed: data\edgar_documents\UNP\4_2025-09-22
Error processing data\edgar_documents\UNP\4_2025-09-23: File format not allowed: data\edgar_documents\UNP\4_2025-09-23
Error processing data\edgar_documents\UNP\4_2025-09-24: File format not allowed: data\edgar_documents\UNP\4_2025-09-24
Error processing data\edgar_documents\UNP\4_2025-09-26: File format not allowed: data\edgar_documents\UNP\4_2025-09-26
Error processing data\edgar_documents\UNP\4_2025-09-30: File format not allowed: data\edgar_documents\UNP\4_2025-09-30
Error processing data\edgar_documents\UNP\4_2025

2025-11-14 17:49:10,158 - ERROR - Input document 4_2025-10-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:10,159 - INFO - Going to convert document batch...
2025-11-14 17:49:10,170 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:10,171 - ERROR - Input document 4_2025-10-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\UNP\4_2025-10-10: File format not allowed: data\edgar_documents\UNP\4_2025-10-10
Error processing data\edgar_documents\UNP\4_2025-10-14: File format not allowed: data\edgar_documents\UNP\4_2025-10-14
Error processing data\edgar_documents\UNP\4_2025-10-15: File format not allowed: data\edgar_documents\UNP\4_2025-10-15
Error processing data\edgar_documents\UNP\4_2025-10-20: File format not allowed: data\edgar_documents\UNP\4_2025-10-20
Error processing data\edgar_documents\UNP\4_2025-10-22: File format not allowed: data\edgar_documents\UNP\4_2025-10-22
Error processing data\edgar_documents\UNP\4_2025-10-23: File format not allowed: data\edgar_documents\UNP\4_2025-10-23
Error processing data\edgar_documents\UNP\4_2025-10-27: File format not allowed: data\edgar_documents\UNP\4_2025-10-27
Error processing data\edgar_documents\UNP\4_2025-10-28: File format not allowed: data\edgar_documents\UNP\4_2025-10-28
Error processing data\edgar_documents\UNP\4_2025

2025-11-14 17:49:10,339 - ERROR - Input document 4_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:10,340 - INFO - Going to convert document batch...
2025-11-14 17:49:10,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:10,355 - ERROR - Input document 4_2025-11-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\UNP\4_2025-11-05: File format not allowed: data\edgar_documents\UNP\4_2025-11-05
Error processing data\edgar_documents\UNP\4_2025-11-06: File format not allowed: data\edgar_documents\UNP\4_2025-11-06
Error processing data\edgar_documents\UNP\4_2025-11-07: File format not allowed: data\edgar_documents\UNP\4_2025-11-07
Error processing data\edgar_documents\UNP\4_2025-11-10: File format not allowed: data\edgar_documents\UNP\4_2025-11-10
Converted 'data\edgar_documents\UNP\8-K_2023-01-24' --> 'data\processed_data\UNP\8-K_2023-01-24.md'
Converted 'data\edgar_documents\UNP\8-K_2023-02-21' --> 'data\processed_data\UNP\8-K_2023-02-21.md'


2025-11-14 17:49:10,534 - INFO - Processing document 8-K_2023-02-27
2025-11-14 17:49:10,551 - INFO - Finished converting document 8-K_2023-02-27 in 0.05 sec.
2025-11-14 17:49:10,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:10,588 - INFO - Going to convert document batch...
2025-11-14 17:49:10,589 - INFO - Processing document 8-K_2023-04-20
2025-11-14 17:49:10,617 - INFO - Finished converting document 8-K_2023-04-20 in 0.05 sec.
2025-11-14 17:49:10,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:10,687 - INFO - Going to convert document batch...
2025-11-14 17:49:10,688 - INFO - Processing document 8-K_2023-05-19
2025-11-14 17:49:10,928 - INFO - Finished converting document 8-K_2023-05-19 in 0.30 sec.


Converted 'data\edgar_documents\UNP\8-K_2023-02-27' --> 'data\processed_data\UNP\8-K_2023-02-27.md'
Converted 'data\edgar_documents\UNP\8-K_2023-04-20' --> 'data\processed_data\UNP\8-K_2023-04-20.md'


2025-11-14 17:49:10,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:10,978 - INFO - Going to convert document batch...
2025-11-14 17:49:10,979 - INFO - Processing document 8-K_2023-06-13
2025-11-14 17:49:10,994 - INFO - Finished converting document 8-K_2023-06-13 in 0.05 sec.
2025-11-14 17:49:11,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,031 - INFO - Going to convert document batch...
2025-11-14 17:49:11,032 - INFO - Processing document 8-K_2023-07-26
2025-11-14 17:49:11,054 - INFO - Finished converting document 8-K_2023-07-26 in 0.05 sec.
2025-11-14 17:49:11,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,096 - INFO - Going to convert document batch...
2025-11-14 17:49:11,097 - INFO - Processing document 8-K_2023-08-11
2025-11-14 17:49:11,117 - INFO - Finished converting document 8-K_2023-08-11 in 0.05 sec.


Converted 'data\edgar_documents\UNP\8-K_2023-05-19' --> 'data\processed_data\UNP\8-K_2023-05-19.md'
Converted 'data\edgar_documents\UNP\8-K_2023-06-13' --> 'data\processed_data\UNP\8-K_2023-06-13.md'
Converted 'data\edgar_documents\UNP\8-K_2023-07-26' --> 'data\processed_data\UNP\8-K_2023-07-26.md'


2025-11-14 17:49:11,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,152 - INFO - Going to convert document batch...
2025-11-14 17:49:11,153 - INFO - Processing document 8-K_2023-09-29
2025-11-14 17:49:11,168 - INFO - Finished converting document 8-K_2023-09-29 in 0.05 sec.
2025-11-14 17:49:11,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,206 - INFO - Going to convert document batch...
2025-11-14 17:49:11,207 - INFO - Processing document 8-K_2023-10-19
2025-11-14 17:49:11,224 - INFO - Finished converting document 8-K_2023-10-19 in 0.05 sec.
2025-11-14 17:49:11,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,262 - INFO - Going to convert document batch...
2025-11-14 17:49:11,262 - INFO - Processing document 8-K_2023-12-14
2025-11-14 17:49:11,280 - INFO - Finished converting document 8-K_2023-12-14 in 0.05 sec.
2025-11-14 17:49:11,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\UNP\8-K_2023-08-11' --> 'data\processed_data\UNP\8-K_2023-08-11.md'
Converted 'data\edgar_documents\UNP\8-K_2023-09-29' --> 'data\processed_data\UNP\8-K_2023-09-29.md'
Converted 'data\edgar_documents\UNP\8-K_2023-10-19' --> 'data\processed_data\UNP\8-K_2023-10-19.md'
Converted 'data\edgar_documents\UNP\8-K_2023-12-14' --> 'data\processed_data\UNP\8-K_2023-12-14.md'


2025-11-14 17:49:11,314 - INFO - Processing document 8-K_2024-01-25
2025-11-14 17:49:11,329 - INFO - Finished converting document 8-K_2024-01-25 in 0.05 sec.
2025-11-14 17:49:11,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,362 - INFO - Going to convert document batch...
2025-11-14 17:49:11,363 - INFO - Processing document 8-K_2024-04-25
2025-11-14 17:49:11,381 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 17:49:11,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,428 - INFO - Going to convert document batch...
2025-11-14 17:49:11,429 - INFO - Processing document 8-K_2024-05-10
2025-11-14 17:49:11,457 - INFO - Finished converting document 8-K_2024-05-10 in 0.06 sec.
2025-11-14 17:49:11,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,496 - INFO - Going to convert document batch...
2025-11-14 17:49:11,497 - INFO - Processing document 8-K_2024-07-25


Converted 'data\edgar_documents\UNP\8-K_2024-01-25' --> 'data\processed_data\UNP\8-K_2024-01-25.md'
Converted 'data\edgar_documents\UNP\8-K_2024-04-25' --> 'data\processed_data\UNP\8-K_2024-04-25.md'
Converted 'data\edgar_documents\UNP\8-K_2024-05-10' --> 'data\processed_data\UNP\8-K_2024-05-10.md'


2025-11-14 17:49:11,515 - INFO - Finished converting document 8-K_2024-07-25 in 0.05 sec.
2025-11-14 17:49:11,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,550 - INFO - Going to convert document batch...
2025-11-14 17:49:11,551 - INFO - Processing document 8-K_2024-09-19
2025-11-14 17:49:11,588 - INFO - Finished converting document 8-K_2024-09-19 in 0.08 sec.
2025-11-14 17:49:11,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,641 - INFO - Going to convert document batch...
2025-11-14 17:49:11,642 - INFO - Processing document 8-K_2024-10-24
2025-11-14 17:49:11,662 - INFO - Finished converting document 8-K_2024-10-24 in 0.06 sec.
2025-11-14 17:49:11,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,695 - INFO - Going to convert document batch...
2025-11-14 17:49:11,695 - INFO - Processing document 8-K_2025-01-23
2025-11-14 17:49:11,710 - INFO - Finished converting document 8-K_2025-01-23 in 0.

Converted 'data\edgar_documents\UNP\8-K_2024-07-25' --> 'data\processed_data\UNP\8-K_2024-07-25.md'
Converted 'data\edgar_documents\UNP\8-K_2024-09-19' --> 'data\processed_data\UNP\8-K_2024-09-19.md'
Converted 'data\edgar_documents\UNP\8-K_2024-10-24' --> 'data\processed_data\UNP\8-K_2024-10-24.md'


2025-11-14 17:49:11,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,744 - INFO - Going to convert document batch...
2025-11-14 17:49:11,744 - INFO - Processing document 8-K_2025-02-13
2025-11-14 17:49:11,764 - INFO - Finished converting document 8-K_2025-02-13 in 0.05 sec.
2025-11-14 17:49:11,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,798 - INFO - Going to convert document batch...
2025-11-14 17:49:11,798 - INFO - Processing document 8-K_2025-02-18
2025-11-14 17:49:11,814 - INFO - Finished converting document 8-K_2025-02-18 in 0.03 sec.
2025-11-14 17:49:11,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,857 - INFO - Going to convert document batch...
2025-11-14 17:49:11,860 - INFO - Processing document 8-K_2025-04-24
2025-11-14 17:49:11,877 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 17:49:11,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\8-K_2025-01-23' --> 'data\processed_data\UNP\8-K_2025-01-23.md'
Converted 'data\edgar_documents\UNP\8-K_2025-02-13' --> 'data\processed_data\UNP\8-K_2025-02-13.md'
Converted 'data\edgar_documents\UNP\8-K_2025-02-18' --> 'data\processed_data\UNP\8-K_2025-02-18.md'
Converted 'data\edgar_documents\UNP\8-K_2025-04-24' --> 'data\processed_data\UNP\8-K_2025-04-24.md'


2025-11-14 17:49:11,914 - INFO - Going to convert document batch...
2025-11-14 17:49:11,915 - INFO - Processing document 8-K_2025-05-09
2025-11-14 17:49:11,938 - INFO - Finished converting document 8-K_2025-05-09 in 0.05 sec.
2025-11-14 17:49:11,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:11,968 - INFO - Going to convert document batch...
2025-11-14 17:49:11,969 - INFO - Processing document 8-K_2025-07-24
2025-11-14 17:49:11,984 - INFO - Finished converting document 8-K_2025-07-24 in 0.03 sec.
2025-11-14 17:49:12,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:12,019 - INFO - Going to convert document batch...
2025-11-14 17:49:12,020 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:49:12,039 - INFO - Finished converting document 8-K_2025-07-29 in 0.03 sec.
2025-11-14 17:49:12,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:12,071 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UNP\8-K_2025-05-09' --> 'data\processed_data\UNP\8-K_2025-05-09.md'
Converted 'data\edgar_documents\UNP\8-K_2025-07-24' --> 'data\processed_data\UNP\8-K_2025-07-24.md'
Converted 'data\edgar_documents\UNP\8-K_2025-07-29' --> 'data\processed_data\UNP\8-K_2025-07-29.md'
Converted 'data\edgar_documents\UNP\8-K_2025-09-10' --> 'data\processed_data\UNP\8-K_2025-09-10.md'
Converted 'data\edgar_documents\UNP\8-K_2025-10-23' --> 'data\processed_data\UNP\8-K_2025-10-23.md'


2025-11-14 17:49:12,190 - INFO - Going to convert document batch...
2025-11-14 17:49:12,193 - INFO - Processing document 8-K_2025-11-06
2025-11-14 17:49:12,268 - INFO - Finished converting document 8-K_2025-11-06 in 0.12 sec.
2025-11-14 17:49:12,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UNP\8-K_2025-11-06' --> 'data\processed_data\UNP\8-K_2025-11-06.md'


2025-11-14 17:49:13,058 - INFO - Going to convert document batch...
2025-11-14 17:49:13,059 - INFO - Processing document DEF-14A_2023-04-05
2025-11-14 17:49:18,434 - INFO - Finished converting document DEF-14A_2023-04-05 in 6.16 sec.
2025-11-14 17:49:19,059 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:19,060 - ERROR - Input document DEF-14A_2024-03-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:19,062 - INFO - Going to 

Converted 'data\edgar_documents\UNP\DEF-14A_2023-04-05' --> 'data\processed_data\UNP\DEF-14A_2023-04-05.md'
Error processing data\edgar_documents\UNP\DEF-14A_2024-03-26: File format not allowed: data\edgar_documents\UNP\DEF-14A_2024-03-26
Error processing data\edgar_documents\UNP\DEF-14A_2025-03-25: File format not allowed: data\edgar_documents\UNP\DEF-14A_2025-03-25
Processed 103 new files. Errors: 57
Found 92 files to process in data\edgar_documents\UPS


2025-11-14 17:49:19,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:20,526 - INFO - Going to convert document batch...
2025-11-14 17:49:20,527 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:49:20,528 - INFO - Processing document 10-K_2023-02-21
2025-11-14 17:49:23,041 - INFO - Finished converting document 10-K_2023-02-21 in 3.92 sec.
2025-11-14 17:49:23,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-K_2023-02-21' --> 'data\processed_data\UPS\10-K_2023-02-21.md'


2025-11-14 17:49:25,252 - INFO - Going to convert document batch...
2025-11-14 17:49:25,254 - INFO - Processing document 10-K_2024-02-20
2025-11-14 17:49:27,609 - INFO - Finished converting document 10-K_2024-02-20 in 3.83 sec.
2025-11-14 17:49:28,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-K_2024-02-20' --> 'data\processed_data\UPS\10-K_2024-02-20.md'


2025-11-14 17:49:29,905 - INFO - Going to convert document batch...
2025-11-14 17:49:29,907 - INFO - Processing document 10-K_2025-02-18
2025-11-14 17:49:32,274 - INFO - Finished converting document 10-K_2025-02-18 in 3.94 sec.
2025-11-14 17:49:33,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-K_2025-02-18' --> 'data\processed_data\UPS\10-K_2025-02-18.md'


2025-11-14 17:49:33,640 - INFO - Going to convert document batch...
2025-11-14 17:49:33,641 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 17:49:35,164 - INFO - Finished converting document 10-Q_2023-05-03 in 2.12 sec.
2025-11-14 17:49:35,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2023-05-03' --> 'data\processed_data\UPS\10-Q_2023-05-03.md'


2025-11-14 17:49:36,505 - INFO - Going to convert document batch...
2025-11-14 17:49:36,506 - INFO - Processing document 10-Q_2023-08-08
2025-11-14 17:49:37,764 - INFO - Finished converting document 10-Q_2023-08-08 in 2.08 sec.
2025-11-14 17:49:38,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2023-08-08' --> 'data\processed_data\UPS\10-Q_2023-08-08.md'


2025-11-14 17:49:39,576 - INFO - Going to convert document batch...
2025-11-14 17:49:39,576 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 17:49:40,847 - INFO - Finished converting document 10-Q_2023-11-01 in 2.45 sec.
2025-11-14 17:49:41,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2023-11-01' --> 'data\processed_data\UPS\10-Q_2023-11-01.md'


2025-11-14 17:49:42,448 - INFO - Going to convert document batch...
2025-11-14 17:49:42,448 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 17:49:43,450 - INFO - Finished converting document 10-Q_2024-05-03 in 1.89 sec.
2025-11-14 17:49:44,086 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:44,087 - ERROR - Input document 10-Q_2024-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:44,092 - INFO - Going to convert d

Converted 'data\edgar_documents\UPS\10-Q_2024-05-03' --> 'data\processed_data\UPS\10-Q_2024-05-03.md'
Error processing data\edgar_documents\UPS\10-Q_2024-08-07: File format not allowed: data\edgar_documents\UPS\10-Q_2024-08-07


2025-11-14 17:49:45,130 - INFO - Going to convert document batch...
2025-11-14 17:49:45,131 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 17:49:46,576 - INFO - Finished converting document 10-Q_2024-11-06 in 2.48 sec.
2025-11-14 17:49:47,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2024-11-06' --> 'data\processed_data\UPS\10-Q_2024-11-06.md'


2025-11-14 17:49:48,002 - INFO - Going to convert document batch...
2025-11-14 17:49:48,003 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 17:49:49,081 - INFO - Finished converting document 10-Q_2025-05-07 in 1.91 sec.
2025-11-14 17:49:49,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2025-05-07' --> 'data\processed_data\UPS\10-Q_2025-05-07.md'


2025-11-14 17:49:50,332 - INFO - Going to convert document batch...
2025-11-14 17:49:50,333 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 17:49:52,100 - INFO - Finished converting document 10-Q_2025-08-06 in 2.45 sec.
2025-11-14 17:49:52,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\10-Q_2025-08-06' --> 'data\processed_data\UPS\10-Q_2025-08-06.md'


2025-11-14 17:49:53,401 - INFO - Going to convert document batch...
2025-11-14 17:49:53,401 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 17:49:54,748 - INFO - Finished converting document 10-Q_2025-11-05 in 2.08 sec.
2025-11-14 17:49:55,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:55,784 - INFO - Going to convert document batch...
2025-11-14 17:49:55,786 - INFO - Processing document 4_2023-01-06
2025-11-14 17:49:55,804 - INFO - Finished converting document 4_2023-01-06 in 0.03 sec.
2025-11-14 17:49:55,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:55,864 - INFO - Going to convert document batch...
2025-11-14 17:49:55,865 - INFO - Processing document 4_2023-01-27
2025-11-14 17:49:55,884 - INFO - Finished converting document 4_2023-01-27 in 0.05 sec.
2025-11-14 17:49:55,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:55,951 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\10-Q_2025-11-05' --> 'data\processed_data\UPS\10-Q_2025-11-05.md'
Converted 'data\edgar_documents\UPS\4_2023-01-06' --> 'data\processed_data\UPS\4_2023-01-06.md'
Converted 'data\edgar_documents\UPS\4_2023-01-27' --> 'data\processed_data\UPS\4_2023-01-27.md'


2025-11-14 17:49:55,952 - INFO - Processing document 4_2023-02-03
2025-11-14 17:49:55,992 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.
2025-11-14 17:49:56,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,045 - INFO - Going to convert document batch...
2025-11-14 17:49:56,047 - INFO - Processing document 4_2023-02-10
2025-11-14 17:49:56,067 - INFO - Finished converting document 4_2023-02-10 in 0.05 sec.
2025-11-14 17:49:56,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,136 - INFO - Going to convert document batch...
2025-11-14 17:49:56,137 - INFO - Processing document 4_2023-02-16
2025-11-14 17:49:56,155 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.
2025-11-14 17:49:56,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,201 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\4_2023-02-03' --> 'data\processed_data\UPS\4_2023-02-03.md'
Converted 'data\edgar_documents\UPS\4_2023-02-10' --> 'data\processed_data\UPS\4_2023-02-10.md'
Converted 'data\edgar_documents\UPS\4_2023-02-16' --> 'data\processed_data\UPS\4_2023-02-16.md'


2025-11-14 17:49:56,202 - INFO - Processing document 4_2023-02-22
2025-11-14 17:49:56,237 - INFO - Finished converting document 4_2023-02-22 in 0.06 sec.
2025-11-14 17:49:56,288 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:56,290 - ERROR - Input document 4_2023-02-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:56,291 - INFO - Going to convert document batch...
2025-11-14 17:49:56,307 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\UPS\4_2023-02-22' --> 'data\processed_data\UPS\4_2023-02-22.md'
Error processing data\edgar_documents\UPS\4_2023-02-23: File format not allowed: data\edgar_documents\UPS\4_2023-02-23
Error processing data\edgar_documents\UPS\4_2023-02-24: File format not allowed: data\edgar_documents\UPS\4_2023-02-24
Error processing data\edgar_documents\UPS\4_2023-02-28: File format not allowed: data\edgar_documents\UPS\4_2023-02-28
Error processing data\edgar_documents\UPS\4_2023-03-02: File format not allowed: data\edgar_documents\UPS\4_2023-03-02
Converted 'data\edgar_documents\UPS\4_2023-03-29' --> 'data\processed_data\UPS\4_2023-03-29.md'


2025-11-14 17:49:56,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,516 - INFO - Going to convert document batch...
2025-11-14 17:49:56,517 - INFO - Processing document 4_2023-05-05
2025-11-14 17:49:56,542 - INFO - Finished converting document 4_2023-05-05 in 0.06 sec.
2025-11-14 17:49:56,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,617 - INFO - Going to convert document batch...
2025-11-14 17:49:56,619 - INFO - Processing document 4_2023-05-08
2025-11-14 17:49:56,646 - INFO - Finished converting document 4_2023-05-08 in 0.06 sec.


Converted 'data\edgar_documents\UPS\4_2023-04-06' --> 'data\processed_data\UPS\4_2023-04-06.md'
Converted 'data\edgar_documents\UPS\4_2023-05-05' --> 'data\processed_data\UPS\4_2023-05-05.md'
Converted 'data\edgar_documents\UPS\4_2023-05-08' --> 'data\processed_data\UPS\4_2023-05-08.md'


2025-11-14 17:49:56,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,703 - INFO - Going to convert document batch...
2025-11-14 17:49:56,704 - INFO - Processing document 4_2023-05-16
2025-11-14 17:49:56,741 - INFO - Finished converting document 4_2023-05-16 in 0.06 sec.
2025-11-14 17:49:56,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,820 - INFO - Going to convert document batch...
2025-11-14 17:49:56,821 - INFO - Processing document 4_2023-07-21
2025-11-14 17:49:56,845 - INFO - Finished converting document 4_2023-07-21 in 0.06 sec.
2025-11-14 17:49:56,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:56,887 - INFO - Going to convert document batch...
2025-11-14 17:49:56,888 - INFO - Processing document 4_2023-08-04
2025-11-14 17:49:56,908 - INFO - Finished converting document 4_2023-08-04 in 0.05 sec.
2025-11-14 17:49:56,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\UPS\4_2023-05-16' --> 'data\processed_data\UPS\4_2023-05-16.md'
Converted 'data\edgar_documents\UPS\4_2023-07-21' --> 'data\processed_data\UPS\4_2023-07-21.md'
Converted 'data\edgar_documents\UPS\4_2023-08-04' --> 'data\processed_data\UPS\4_2023-08-04.md'


2025-11-14 17:49:56,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,006 - INFO - Going to convert document batch...
2025-11-14 17:49:57,007 - INFO - Processing document 4_2023-08-16
2025-11-14 17:49:57,031 - INFO - Finished converting document 4_2023-08-16 in 0.05 sec.
2025-11-14 17:49:57,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,096 - INFO - Going to convert document batch...
2025-11-14 17:49:57,097 - INFO - Processing document 4_2023-11-03
2025-11-14 17:49:57,126 - INFO - Finished converting document 4_2023-11-03 in 0.06 sec.
2025-11-14 17:49:57,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,172 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\4_2023-08-11' --> 'data\processed_data\UPS\4_2023-08-11.md'
Converted 'data\edgar_documents\UPS\4_2023-08-16' --> 'data\processed_data\UPS\4_2023-08-16.md'
Converted 'data\edgar_documents\UPS\4_2023-11-03' --> 'data\processed_data\UPS\4_2023-11-03.md'


2025-11-14 17:49:57,173 - INFO - Processing document 4_2023-11-15
2025-11-14 17:49:57,195 - INFO - Finished converting document 4_2023-11-15 in 0.05 sec.
2025-11-14 17:49:57,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,237 - INFO - Going to convert document batch...
2025-11-14 17:49:57,238 - INFO - Processing document 4_2024-02-05
2025-11-14 17:49:57,258 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 17:49:57,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,297 - INFO - Going to convert document batch...
2025-11-14 17:49:57,298 - INFO - Processing document 4_2024-02-09
2025-11-14 17:49:57,318 - INFO - Finished converting document 4_2024-02-09 in 0.03 sec.
2025-11-14 17:49:57,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,359 - INFO - Going to convert document batch...
2025-11-14 17:49:57,360 - INFO - Processing document 4_2024-02-21
2025-11-14 17:49:57,388 - IN

Converted 'data\edgar_documents\UPS\4_2023-11-15' --> 'data\processed_data\UPS\4_2023-11-15.md'
Converted 'data\edgar_documents\UPS\4_2024-02-05' --> 'data\processed_data\UPS\4_2024-02-05.md'
Converted 'data\edgar_documents\UPS\4_2024-02-09' --> 'data\processed_data\UPS\4_2024-02-09.md'


2025-11-14 17:49:57,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,433 - INFO - Going to convert document batch...
2025-11-14 17:49:57,434 - INFO - Processing document 4_2024-03-22
2025-11-14 17:49:57,452 - INFO - Finished converting document 4_2024-03-22 in 0.05 sec.
2025-11-14 17:49:57,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,504 - INFO - Going to convert document batch...
2025-11-14 17:49:57,505 - INFO - Processing document 4_2024-03-27
2025-11-14 17:49:57,531 - INFO - Finished converting document 4_2024-03-27 in 0.06 sec.
2025-11-14 17:49:57,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,573 - INFO - Going to convert document batch...
2025-11-14 17:49:57,574 - INFO - Processing document 4_2024-05-03
2025-11-14 17:49:57,593 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.


Converted 'data\edgar_documents\UPS\4_2024-02-21' --> 'data\processed_data\UPS\4_2024-02-21.md'
Converted 'data\edgar_documents\UPS\4_2024-03-22' --> 'data\processed_data\UPS\4_2024-03-22.md'
Converted 'data\edgar_documents\UPS\4_2024-03-27' --> 'data\processed_data\UPS\4_2024-03-27.md'


2025-11-14 17:49:57,632 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:57,633 - ERROR - Input document 4_2024-05-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:57,634 - INFO - Going to convert document batch...
2025-11-14 17:49:57,653 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:57,654 - ERROR - Input document 4_2024-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\UPS\4_2024-05-03' --> 'data\processed_data\UPS\4_2024-05-03.md'
Error processing data\edgar_documents\UPS\4_2024-05-20: File format not allowed: data\edgar_documents\UPS\4_2024-05-20
Error processing data\edgar_documents\UPS\4_2024-05-21: File format not allowed: data\edgar_documents\UPS\4_2024-05-21
Error processing data\edgar_documents\UPS\4_2024-05-22: File format not allowed: data\edgar_documents\UPS\4_2024-05-22
Error processing data\edgar_documents\UPS\4_2024-05-23: File format not allowed: data\edgar_documents\UPS\4_2024-05-23
Converted 'data\edgar_documents\UPS\4_2024-07-19' --> 'data\processed_data\UPS\4_2024-07-19.md'


2025-11-14 17:49:57,793 - INFO - Processing document 4_2024-07-25
2025-11-14 17:49:57,810 - INFO - Finished converting document 4_2024-07-25 in 0.05 sec.
2025-11-14 17:49:57,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,873 - INFO - Going to convert document batch...
2025-11-14 17:49:57,874 - INFO - Processing document 4_2024-08-09
2025-11-14 17:49:57,901 - INFO - Finished converting document 4_2024-08-09 in 0.06 sec.
2025-11-14 17:49:57,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:57,939 - INFO - Going to convert document batch...
2025-11-14 17:49:57,940 - INFO - Processing document 4_2024-11-08
2025-11-14 17:49:57,963 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 17:49:57,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,005 - INFO - Going to convert document batch...
2025-11-14 17:49:58,005 - INFO - Processing document 4_2024-11-27
2025-11-14 17:49:58,024 - IN

Converted 'data\edgar_documents\UPS\4_2024-07-25' --> 'data\processed_data\UPS\4_2024-07-25.md'
Converted 'data\edgar_documents\UPS\4_2024-08-09' --> 'data\processed_data\UPS\4_2024-08-09.md'
Converted 'data\edgar_documents\UPS\4_2024-11-08' --> 'data\processed_data\UPS\4_2024-11-08.md'


2025-11-14 17:49:58,054 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,064 - INFO - Going to convert document batch...
2025-11-14 17:49:58,064 - INFO - Processing document 4_2025-02-04
2025-11-14 17:49:58,088 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 17:49:58,124 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,133 - INFO - Going to convert document batch...
2025-11-14 17:49:58,133 - INFO - Processing document 4_2025-02-07
2025-11-14 17:49:58,152 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 17:49:58,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,191 - INFO - Going to convert document batch...
2025-11-14 17:49:58,192 - INFO - Processing document 4_2025-02-18
2025-11-14 17:49:58,213 - INFO - Finished converting document 4_2025-02-18 in 0.03 sec.


Converted 'data\edgar_documents\UPS\4_2024-11-27' --> 'data\processed_data\UPS\4_2024-11-27.md'
Converted 'data\edgar_documents\UPS\4_2025-02-04' --> 'data\processed_data\UPS\4_2025-02-04.md'
Converted 'data\edgar_documents\UPS\4_2025-02-07' --> 'data\processed_data\UPS\4_2025-02-07.md'


2025-11-14 17:49:58,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,254 - INFO - Going to convert document batch...
2025-11-14 17:49:58,255 - INFO - Processing document 4_2025-03-04
2025-11-14 17:49:58,277 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.
2025-11-14 17:49:58,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,336 - INFO - Going to convert document batch...
2025-11-14 17:49:58,337 - INFO - Processing document 4_2025-03-25
2025-11-14 17:49:58,358 - INFO - Finished converting document 4_2025-03-25 in 0.06 sec.
2025-11-14 17:49:58,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,417 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\4_2025-02-18' --> 'data\processed_data\UPS\4_2025-02-18.md'
Converted 'data\edgar_documents\UPS\4_2025-03-04' --> 'data\processed_data\UPS\4_2025-03-04.md'
Converted 'data\edgar_documents\UPS\4_2025-03-25' --> 'data\processed_data\UPS\4_2025-03-25.md'


2025-11-14 17:49:58,418 - INFO - Processing document 4_2025-05-09
2025-11-14 17:49:58,441 - INFO - Finished converting document 4_2025-05-09 in 0.06 sec.
2025-11-14 17:49:58,488 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:49:58,490 - ERROR - Input document 4_2025-05-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:49:58,492 - INFO - Going to convert document batch...
2025-11-14 17:49:58,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49

Converted 'data\edgar_documents\UPS\4_2025-05-09' --> 'data\processed_data\UPS\4_2025-05-09.md'
Error processing data\edgar_documents\UPS\4_2025-05-12: File format not allowed: data\edgar_documents\UPS\4_2025-05-12
Converted 'data\edgar_documents\UPS\4_2025-05-13' --> 'data\processed_data\UPS\4_2025-05-13.md'
Error processing data\edgar_documents\UPS\4_2025-05-14: File format not allowed: data\edgar_documents\UPS\4_2025-05-14
Error processing data\edgar_documents\UPS\4_2025-05-15: File format not allowed: data\edgar_documents\UPS\4_2025-05-15


2025-11-14 17:49:58,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,696 - INFO - Going to convert document batch...
2025-11-14 17:49:58,697 - INFO - Processing document 4_2025-08-01
2025-11-14 17:49:58,727 - INFO - Finished converting document 4_2025-08-01 in 0.05 sec.
2025-11-14 17:49:58,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,780 - INFO - Going to convert document batch...
2025-11-14 17:49:58,781 - INFO - Processing document 4_2025-08-07
2025-11-14 17:49:58,815 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.
2025-11-14 17:49:58,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\4_2025-06-03' --> 'data\processed_data\UPS\4_2025-06-03.md'
Converted 'data\edgar_documents\UPS\4_2025-08-01' --> 'data\processed_data\UPS\4_2025-08-01.md'
Converted 'data\edgar_documents\UPS\4_2025-08-07' --> 'data\processed_data\UPS\4_2025-08-07.md'


2025-11-14 17:49:58,865 - INFO - Going to convert document batch...
2025-11-14 17:49:58,865 - INFO - Processing document 4_2025-08-26
2025-11-14 17:49:58,886 - INFO - Finished converting document 4_2025-08-26 in 0.05 sec.
2025-11-14 17:49:58,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:58,926 - INFO - Going to convert document batch...
2025-11-14 17:49:58,926 - INFO - Processing document 4_2025-11-07
2025-11-14 17:49:58,947 - INFO - Finished converting document 4_2025-11-07 in 0.03 sec.
2025-11-14 17:49:58,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,000 - INFO - Going to convert document batch...
2025-11-14 17:49:59,001 - INFO - Processing document 8-K_2023-01-31
2025-11-14 17:49:59,019 - INFO - Finished converting document 8-K_2023-01-31 in 0.05 sec.
2025-11-14 17:49:59,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,075 - INFO - Going to convert document batch...
2025-11-14 17:49:59,07

Converted 'data\edgar_documents\UPS\4_2025-08-26' --> 'data\processed_data\UPS\4_2025-08-26.md'
Converted 'data\edgar_documents\UPS\4_2025-11-07' --> 'data\processed_data\UPS\4_2025-11-07.md'
Converted 'data\edgar_documents\UPS\8-K_2023-01-31' --> 'data\processed_data\UPS\8-K_2023-01-31.md'


2025-11-14 17:49:59,113 - INFO - Finished converting document 8-K_2023-02-27 in 0.08 sec.
2025-11-14 17:49:59,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,154 - INFO - Going to convert document batch...
2025-11-14 17:49:59,155 - INFO - Processing document 8-K_2023-03-07
2025-11-14 17:49:59,180 - INFO - Finished converting document 8-K_2023-03-07 in 0.05 sec.
2025-11-14 17:49:59,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,226 - INFO - Going to convert document batch...
2025-11-14 17:49:59,228 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:49:59,248 - INFO - Finished converting document 8-K_2023-04-25 in 0.06 sec.
2025-11-14 17:49:59,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,307 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\8-K_2023-02-27' --> 'data\processed_data\UPS\8-K_2023-02-27.md'
Converted 'data\edgar_documents\UPS\8-K_2023-03-07' --> 'data\processed_data\UPS\8-K_2023-03-07.md'
Converted 'data\edgar_documents\UPS\8-K_2023-04-25' --> 'data\processed_data\UPS\8-K_2023-04-25.md'


2025-11-14 17:49:59,308 - INFO - Processing document 8-K_2023-05-09
2025-11-14 17:49:59,366 - INFO - Finished converting document 8-K_2023-05-09 in 0.09 sec.
2025-11-14 17:49:59,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,445 - INFO - Going to convert document batch...
2025-11-14 17:49:59,446 - INFO - Processing document 8-K_2023-08-08
2025-11-14 17:49:59,464 - INFO - Finished converting document 8-K_2023-08-08 in 0.08 sec.
2025-11-14 17:49:59,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,502 - INFO - Going to convert document batch...
2025-11-14 17:49:59,503 - INFO - Processing document 8-K_2023-09-11
2025-11-14 17:49:59,521 - INFO - Finished converting document 8-K_2023-09-11 in 0.05 sec.
2025-11-14 17:49:59,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,560 - INFO - Going to convert document batch...
2025-11-14 17:49:59,561 - INFO - Processing document 8-K_2023-10-26
2025-11-14 17:

Converted 'data\edgar_documents\UPS\8-K_2023-05-09' --> 'data\processed_data\UPS\8-K_2023-05-09.md'
Converted 'data\edgar_documents\UPS\8-K_2023-08-08' --> 'data\processed_data\UPS\8-K_2023-08-08.md'
Converted 'data\edgar_documents\UPS\8-K_2023-09-11' --> 'data\processed_data\UPS\8-K_2023-09-11.md'


2025-11-14 17:49:59,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,614 - INFO - Going to convert document batch...
2025-11-14 17:49:59,615 - INFO - Processing document 8-K_2024-01-30
2025-11-14 17:49:59,634 - INFO - Finished converting document 8-K_2024-01-30 in 0.03 sec.
2025-11-14 17:49:59,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,669 - INFO - Going to convert document batch...
2025-11-14 17:49:59,670 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:49:59,706 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 17:49:59,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,777 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\UPS\8-K_2023-10-26' --> 'data\processed_data\UPS\8-K_2023-10-26.md'
Converted 'data\edgar_documents\UPS\8-K_2024-01-30' --> 'data\processed_data\UPS\8-K_2024-01-30.md'
Converted 'data\edgar_documents\UPS\8-K_2024-04-23' --> 'data\processed_data\UPS\8-K_2024-04-23.md'


2025-11-14 17:49:59,778 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:49:59,822 - INFO - Finished converting document 8-K_2024-05-06 in 0.09 sec.
2025-11-14 17:49:59,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,873 - INFO - Going to convert document batch...
2025-11-14 17:49:59,874 - INFO - Processing document 8-K_2024-05-22
2025-11-14 17:49:59,898 - INFO - Finished converting document 8-K_2024-05-22 in 0.05 sec.
2025-11-14 17:49:59,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:49:59,941 - INFO - Going to convert document batch...
2025-11-14 17:49:59,942 - INFO - Processing document 8-K_2024-05-28
2025-11-14 17:49:59,967 - INFO - Finished converting document 8-K_2024-05-28 in 0.06 sec.
2025-11-14 17:49:59,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,008 - INFO - Going to convert document batch...
2025-11-14 17:50:00,009 - INFO - Processing document 8-K_2024-07-09
2025-11-14 17:

Converted 'data\edgar_documents\UPS\8-K_2024-05-06' --> 'data\processed_data\UPS\8-K_2024-05-06.md'
Converted 'data\edgar_documents\UPS\8-K_2024-05-22' --> 'data\processed_data\UPS\8-K_2024-05-22.md'
Converted 'data\edgar_documents\UPS\8-K_2024-05-28' --> 'data\processed_data\UPS\8-K_2024-05-28.md'


2025-11-14 17:50:00,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,071 - INFO - Going to convert document batch...
2025-11-14 17:50:00,072 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:50:00,092 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 17:50:00,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,150 - INFO - Going to convert document batch...
2025-11-14 17:50:00,151 - INFO - Processing document 8-K_2024-10-24
2025-11-14 17:50:00,174 - INFO - Finished converting document 8-K_2024-10-24 in 0.06 sec.
2025-11-14 17:50:00,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,213 - INFO - Going to convert document batch...
2025-11-14 17:50:00,214 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:50:00,233 - INFO - Finished converting document 8-K_2025-01-30 in 0.05 sec.


Converted 'data\edgar_documents\UPS\8-K_2024-07-09' --> 'data\processed_data\UPS\8-K_2024-07-09.md'
Converted 'data\edgar_documents\UPS\8-K_2024-07-23' --> 'data\processed_data\UPS\8-K_2024-07-23.md'
Converted 'data\edgar_documents\UPS\8-K_2024-10-24' --> 'data\processed_data\UPS\8-K_2024-10-24.md'


2025-11-14 17:50:00,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,269 - INFO - Going to convert document batch...
2025-11-14 17:50:00,270 - INFO - Processing document 8-K_2025-03-03
2025-11-14 17:50:00,294 - INFO - Finished converting document 8-K_2025-03-03 in 0.05 sec.
2025-11-14 17:50:00,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,329 - INFO - Going to convert document batch...
2025-11-14 17:50:00,330 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:50:00,351 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 17:50:00,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,402 - INFO - Going to convert document batch...
2025-11-14 17:50:00,403 - INFO - Processing document 8-K_2025-05-12


Converted 'data\edgar_documents\UPS\8-K_2025-01-30' --> 'data\processed_data\UPS\8-K_2025-01-30.md'
Converted 'data\edgar_documents\UPS\8-K_2025-03-03' --> 'data\processed_data\UPS\8-K_2025-03-03.md'
Converted 'data\edgar_documents\UPS\8-K_2025-04-29' --> 'data\processed_data\UPS\8-K_2025-04-29.md'


2025-11-14 17:50:00,442 - INFO - Finished converting document 8-K_2025-05-12 in 0.08 sec.
2025-11-14 17:50:00,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,488 - INFO - Going to convert document batch...
2025-11-14 17:50:00,489 - INFO - Processing document 8-K_2025-05-14
2025-11-14 17:50:00,519 - INFO - Finished converting document 8-K_2025-05-14 in 0.06 sec.
2025-11-14 17:50:00,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:00,588 - INFO - Going to convert document batch...
2025-11-14 17:50:00,589 - INFO - Processing document 8-K_2025-05-20
2025-11-14 17:50:00,614 - INFO - Finished converting document 8-K_2025-05-20 in 0.08 sec.
2025-11-14 17:50:00,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\8-K_2025-05-12' --> 'data\processed_data\UPS\8-K_2025-05-12.md'
Converted 'data\edgar_documents\UPS\8-K_2025-05-14' --> 'data\processed_data\UPS\8-K_2025-05-14.md'
Converted 'data\edgar_documents\UPS\8-K_2025-05-20' --> 'data\processed_data\UPS\8-K_2025-05-20.md'


2025-11-14 17:50:00,654 - INFO - Going to convert document batch...
2025-11-14 17:50:00,655 - INFO - Processing document 8-K_2025-06-02
2025-11-14 17:50:01,102 - INFO - Finished converting document 8-K_2025-06-02 in 0.47 sec.
2025-11-14 17:50:01,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:01,142 - INFO - Going to convert document batch...
2025-11-14 17:50:01,142 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:50:01,161 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 17:50:01,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:01,196 - INFO - Going to convert document batch...
2025-11-14 17:50:01,197 - INFO - Processing document 8-K_2025-09-18
2025-11-14 17:50:01,212 - INFO - Finished converting document 8-K_2025-09-18 in 0.03 sec.
2025-11-14 17:50:01,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:01,243 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\UPS\8-K_2025-06-02' --> 'data\processed_data\UPS\8-K_2025-06-02.md'
Converted 'data\edgar_documents\UPS\8-K_2025-07-29' --> 'data\processed_data\UPS\8-K_2025-07-29.md'
Converted 'data\edgar_documents\UPS\8-K_2025-09-18' --> 'data\processed_data\UPS\8-K_2025-09-18.md'


2025-11-14 17:50:01,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\8-K_2025-10-28' --> 'data\processed_data\UPS\8-K_2025-10-28.md'


2025-11-14 17:50:01,755 - INFO - Going to convert document batch...
2025-11-14 17:50:01,755 - INFO - Processing document DEF-14A_2023-03-20
2025-11-14 17:50:03,222 - INFO - Finished converting document DEF-14A_2023-03-20 in 1.92 sec.
2025-11-14 17:50:03,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\DEF-14A_2023-03-20' --> 'data\processed_data\UPS\DEF-14A_2023-03-20.md'


2025-11-14 17:50:04,277 - INFO - Going to convert document batch...
2025-11-14 17:50:04,277 - INFO - Processing document DEF-14A_2024-03-18
2025-11-14 17:50:05,340 - INFO - Finished converting document DEF-14A_2024-03-18 in 1.62 sec.
2025-11-14 17:50:05,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\UPS\DEF-14A_2024-03-18' --> 'data\processed_data\UPS\DEF-14A_2024-03-18.md'


2025-11-14 17:50:06,185 - INFO - Going to convert document batch...
2025-11-14 17:50:06,186 - INFO - Processing document DEF-14A_2025-03-17
2025-11-14 17:50:07,363 - INFO - Finished converting document DEF-14A_2025-03-17 in 1.55 sec.
2025-11-14 17:50:07,944 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:07,944 - ERROR - Input document 10-K_2023-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:07,946 - INFO - Going to con

Converted 'data\edgar_documents\UPS\DEF-14A_2025-03-17' --> 'data\processed_data\UPS\DEF-14A_2025-03-17.md'
Processed 80 new files. Errors: 12
Found 184 files to process in data\edgar_documents\USB
Error processing data\edgar_documents\USB\10-K_2023-02-27: File format not allowed: data\edgar_documents\USB\10-K_2023-02-27


2025-11-14 17:50:08,516 - INFO - Going to convert document batch...
2025-11-14 17:50:08,517 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:50:08,518 - INFO - Processing document 10-K_2024-02-20
2025-11-14 17:50:08,842 - INFO - Finished converting document 10-K_2024-02-20 in 0.91 sec.
2025-11-14 17:50:08,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-K_2024-02-20' --> 'data\processed_data\USB\10-K_2024-02-20.md'


2025-11-14 17:50:09,170 - INFO - Going to convert document batch...
2025-11-14 17:50:09,171 - INFO - Processing document 10-K_2025-02-21
2025-11-14 17:50:09,471 - INFO - Finished converting document 10-K_2025-02-21 in 0.55 sec.
2025-11-14 17:50:09,655 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:09,657 - ERROR - Input document 10-Q_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:09,663 - INFO - Going to convert d

Converted 'data\edgar_documents\USB\10-K_2025-02-21' --> 'data\processed_data\USB\10-K_2025-02-21.md'
Error processing data\edgar_documents\USB\10-Q_2023-05-08: File format not allowed: data\edgar_documents\USB\10-Q_2023-05-08


2025-11-14 17:50:09,823 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:09,824 - ERROR - Input document 10-Q_2023-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:09,830 - INFO - Going to convert document batch...
2025-11-14 17:50:09,962 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:09,963 - ERROR - Input document 10-Q_2023-11-01 with format None doe

Error processing data\edgar_documents\USB\10-Q_2023-08-07: File format not allowed: data\edgar_documents\USB\10-Q_2023-08-07
Error processing data\edgar_documents\USB\10-Q_2023-11-01: File format not allowed: data\edgar_documents\USB\10-Q_2023-11-01


2025-11-14 17:50:10,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:11,063 - INFO - Going to convert document batch...
2025-11-14 17:50:11,063 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 17:50:13,113 - INFO - Finished converting document 10-Q_2024-05-01 in 3.14 sec.
2025-11-14 17:50:13,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-Q_2024-05-01' --> 'data\processed_data\USB\10-Q_2024-05-01.md'


2025-11-14 17:50:15,457 - INFO - Going to convert document batch...
2025-11-14 17:50:15,458 - INFO - Processing document 10-Q_2024-08-06
2025-11-14 17:50:17,911 - INFO - Finished converting document 10-Q_2024-08-06 in 4.11 sec.
2025-11-14 17:50:18,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-Q_2024-08-06' --> 'data\processed_data\USB\10-Q_2024-08-06.md'


2025-11-14 17:50:20,514 - INFO - Going to convert document batch...
2025-11-14 17:50:20,515 - INFO - Processing document 10-Q_2024-11-05
2025-11-14 17:50:22,871 - INFO - Finished converting document 10-Q_2024-11-05 in 4.11 sec.
2025-11-14 17:50:23,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-Q_2024-11-05' --> 'data\processed_data\USB\10-Q_2024-11-05.md'


2025-11-14 17:50:25,152 - INFO - Going to convert document batch...
2025-11-14 17:50:25,153 - INFO - Processing document 10-Q_2025-05-06
2025-11-14 17:50:27,431 - INFO - Finished converting document 10-Q_2025-05-06 in 3.69 sec.
2025-11-14 17:50:28,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-Q_2025-05-06' --> 'data\processed_data\USB\10-Q_2025-05-06.md'


2025-11-14 17:50:29,336 - INFO - Going to convert document batch...
2025-11-14 17:50:29,337 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 17:50:32,193 - INFO - Finished converting document 10-Q_2025-08-07 in 4.03 sec.
2025-11-14 17:50:33,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\10-Q_2025-08-07' --> 'data\processed_data\USB\10-Q_2025-08-07.md'


2025-11-14 17:50:34,804 - INFO - Going to convert document batch...
2025-11-14 17:50:34,805 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 17:50:37,172 - INFO - Finished converting document 10-Q_2025-11-05 in 4.16 sec.
2025-11-14 17:50:38,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,035 - INFO - Going to convert document batch...
2025-11-14 17:50:38,035 - INFO - Processing document 4_2023-01-26
2025-11-14 17:50:38,051 - INFO - Finished converting document 4_2023-01-26 in 0.03 sec.
2025-11-14 17:50:38,107 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:38,109 - ERROR - Input document 4_2023-01-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\USB\10-Q_2025-11-05' --> 'data\processed_data\USB\10-Q_2025-11-05.md'
Converted 'data\edgar_documents\USB\4_2023-01-26' --> 'data\processed_data\USB\4_2023-01-26.md'
Error processing data\edgar_documents\USB\4_2023-01-27: File format not allowed: data\edgar_documents\USB\4_2023-01-27
Converted 'data\edgar_documents\USB\4_2023-02-13' --> 'data\processed_data\USB\4_2023-02-13.md'


2025-11-14 17:50:38,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,248 - INFO - Going to convert document batch...
2025-11-14 17:50:38,249 - INFO - Processing document 4_2023-03-07
2025-11-14 17:50:38,266 - INFO - Finished converting document 4_2023-03-07 in 0.03 sec.
2025-11-14 17:50:38,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,307 - INFO - Going to convert document batch...
2025-11-14 17:50:38,308 - INFO - Processing document 4_2023-03-09
2025-11-14 17:50:38,329 - INFO - Finished converting document 4_2023-03-09 in 0.05 sec.
2025-11-14 17:50:38,373 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:38,374 - ERROR - Input document 4_2023-04-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\USB\4_2023-03-06' --> 'data\processed_data\USB\4_2023-03-06.md'
Converted 'data\edgar_documents\USB\4_2023-03-07' --> 'data\processed_data\USB\4_2023-03-07.md'
Converted 'data\edgar_documents\USB\4_2023-03-09' --> 'data\processed_data\USB\4_2023-03-09.md'
Error processing data\edgar_documents\USB\4_2023-04-21: File format not allowed: data\edgar_documents\USB\4_2023-04-21


2025-11-14 17:50:38,427 - INFO - Finished converting document 4_2023-04-24 in 0.05 sec.
2025-11-14 17:50:38,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,481 - INFO - Going to convert document batch...
2025-11-14 17:50:38,485 - INFO - Processing document 4_2023-05-01
2025-11-14 17:50:38,523 - INFO - Finished converting document 4_2023-05-01 in 0.06 sec.
2025-11-14 17:50:38,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,589 - INFO - Going to convert document batch...
2025-11-14 17:50:38,590 - INFO - Processing document 4_2023-05-05
2025-11-14 17:50:38,615 - INFO - Finished converting document 4_2023-05-05 in 0.05 sec.


Converted 'data\edgar_documents\USB\4_2023-04-24' --> 'data\processed_data\USB\4_2023-04-24.md'
Converted 'data\edgar_documents\USB\4_2023-05-01' --> 'data\processed_data\USB\4_2023-05-01.md'
Converted 'data\edgar_documents\USB\4_2023-05-05' --> 'data\processed_data\USB\4_2023-05-05.md'


2025-11-14 17:50:38,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:38,696 - INFO - Going to convert document batch...
2025-11-14 17:50:38,697 - INFO - Processing document 4_2023-05-09
2025-11-14 17:50:38,730 - INFO - Finished converting document 4_2023-05-09 in 0.08 sec.
2025-11-14 17:50:38,790 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:38,791 - ERROR - Input document 4_2023-06-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50

Converted 'data\edgar_documents\USB\4_2023-05-09' --> 'data\processed_data\USB\4_2023-05-09.md'
Error processing data\edgar_documents\USB\4_2023-06-08: File format not allowed: data\edgar_documents\USB\4_2023-06-08
Converted 'data\edgar_documents\USB\4_2023-08-10' --> 'data\processed_data\USB\4_2023-08-10.md'
Converted 'data\edgar_documents\USB\4_2023-08-11' --> 'data\processed_data\USB\4_2023-08-11.md'


2025-11-14 17:50:38,978 - INFO - Going to convert document batch...
2025-11-14 17:50:38,979 - INFO - Processing document 4_2023-10-20
2025-11-14 17:50:39,037 - INFO - Finished converting document 4_2023-10-20 in 0.09 sec.
2025-11-14 17:50:39,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,103 - INFO - Going to convert document batch...
2025-11-14 17:50:39,104 - INFO - Processing document 4_2023-10-24
2025-11-14 17:50:39,124 - INFO - Finished converting document 4_2023-10-24 in 0.05 sec.
2025-11-14 17:50:39,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,165 - INFO - Going to convert document batch...
2025-11-14 17:50:39,166 - INFO - Processing document 4_2023-12-11
2025-11-14 17:50:39,185 - INFO - Finished converting document 4_2023-12-11 in 0.05 sec.
2025-11-14 17:50:39,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,238 - INFO - Going to convert document batch...
2025-11-14 17:50:39,238 - 

Converted 'data\edgar_documents\USB\4_2023-10-20' --> 'data\processed_data\USB\4_2023-10-20.md'
Converted 'data\edgar_documents\USB\4_2023-10-24' --> 'data\processed_data\USB\4_2023-10-24.md'
Converted 'data\edgar_documents\USB\4_2023-12-11' --> 'data\processed_data\USB\4_2023-12-11.md'
Converted 'data\edgar_documents\USB\4_2023-12-15' --> 'data\processed_data\USB\4_2023-12-15.md'


2025-11-14 17:50:39,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,310 - INFO - Going to convert document batch...
2025-11-14 17:50:39,311 - INFO - Processing document 4_2023-12-18
2025-11-14 17:50:39,328 - INFO - Finished converting document 4_2023-12-18 in 0.06 sec.
2025-11-14 17:50:39,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,370 - INFO - Going to convert document batch...
2025-11-14 17:50:39,371 - INFO - Processing document 4_2024-01-19
2025-11-14 17:50:39,391 - INFO - Finished converting document 4_2024-01-19 in 0.05 sec.
2025-11-14 17:50:39,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,448 - INFO - Going to convert document batch...
2025-11-14 17:50:39,448 - INFO - Processing document 4_2024-02-01
2025-11-14 17:50:39,468 - INFO - Finished converting document 4_2024-02-01 in 0.06 sec.
2025-11-14 17:50:39,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\USB\4_2023-12-18' --> 'data\processed_data\USB\4_2023-12-18.md'
Converted 'data\edgar_documents\USB\4_2024-01-19' --> 'data\processed_data\USB\4_2024-01-19.md'
Converted 'data\edgar_documents\USB\4_2024-02-01' --> 'data\processed_data\USB\4_2024-02-01.md'


2025-11-14 17:50:39,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,578 - INFO - Going to convert document batch...
2025-11-14 17:50:39,579 - INFO - Processing document 4_2024-02-20
2025-11-14 17:50:39,609 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 17:50:39,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,671 - INFO - Going to convert document batch...
2025-11-14 17:50:39,672 - INFO - Processing document 4_2024-02-23
2025-11-14 17:50:39,693 - INFO - Finished converting document 4_2024-02-23 in 0.05 sec.
2025-11-14 17:50:39,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\4_2024-02-16' --> 'data\processed_data\USB\4_2024-02-16.md'
Converted 'data\edgar_documents\USB\4_2024-02-20' --> 'data\processed_data\USB\4_2024-02-20.md'
Converted 'data\edgar_documents\USB\4_2024-02-23' --> 'data\processed_data\USB\4_2024-02-23.md'


2025-11-14 17:50:39,738 - INFO - Going to convert document batch...
2025-11-14 17:50:39,739 - INFO - Processing document 4_2024-03-04
2025-11-14 17:50:39,757 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.
2025-11-14 17:50:39,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,800 - INFO - Going to convert document batch...
2025-11-14 17:50:39,801 - INFO - Processing document 4_2024-03-05
2025-11-14 17:50:39,826 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 17:50:39,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,879 - INFO - Going to convert document batch...
2025-11-14 17:50:39,879 - INFO - Processing document 4_2024-03-06
2025-11-14 17:50:39,896 - INFO - Finished converting document 4_2024-03-06 in 0.05 sec.
2025-11-14 17:50:39,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:39,955 - INFO - Going to convert document batch...
2025-11-14 17:50:39,956 - 

Converted 'data\edgar_documents\USB\4_2024-03-04' --> 'data\processed_data\USB\4_2024-03-04.md'
Converted 'data\edgar_documents\USB\4_2024-03-05' --> 'data\processed_data\USB\4_2024-03-05.md'
Converted 'data\edgar_documents\USB\4_2024-03-06' --> 'data\processed_data\USB\4_2024-03-06.md'


2025-11-14 17:50:40,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:40,021 - INFO - Going to convert document batch...
2025-11-14 17:50:40,022 - INFO - Processing document 4_2024-05-07
2025-11-14 17:50:40,040 - INFO - Finished converting document 4_2024-05-07 in 0.03 sec.
2025-11-14 17:50:40,092 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,093 - ERROR - Input document 4_2024-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50

Converted 'data\edgar_documents\USB\4_2024-04-19' --> 'data\processed_data\USB\4_2024-04-19.md'
Converted 'data\edgar_documents\USB\4_2024-05-07' --> 'data\processed_data\USB\4_2024-05-07.md'
Error processing data\edgar_documents\USB\4_2024-05-14: File format not allowed: data\edgar_documents\USB\4_2024-05-14
Error processing data\edgar_documents\USB\4_2024-05-15: File format not allowed: data\edgar_documents\USB\4_2024-05-15


2025-11-14 17:50:40,236 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,236 - ERROR - Input document 4_2024-07-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:40,238 - INFO - Going to convert document batch...
2025-11-14 17:50:40,251 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,251 - ERROR - Input document 4_2024-07-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\USB\4_2024-07-18' --> 'data\processed_data\USB\4_2024-07-18.md'
Error processing data\edgar_documents\USB\4_2024-07-19: File format not allowed: data\edgar_documents\USB\4_2024-07-19
Error processing data\edgar_documents\USB\4_2024-07-24: File format not allowed: data\edgar_documents\USB\4_2024-07-24
Error processing data\edgar_documents\USB\4_2024-07-26: File format not allowed: data\edgar_documents\USB\4_2024-07-26
Error processing data\edgar_documents\USB\4_2024-09-19: File format not allowed: data\edgar_documents\USB\4_2024-09-19
Error processing data\edgar_documents\USB\4_2024-09-20: File format not allowed: data\edgar_documents\USB\4_2024-09-20
Converted 'data\edgar_documents\USB\4_2024-10-21' --> 'data\processed_data\USB\4_2024-10-21.md'


2025-11-14 17:50:40,436 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,436 - ERROR - Input document 4_2024-10-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:40,437 - INFO - Going to convert document batch...
2025-11-14 17:50:40,449 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,450 - ERROR - Input document 4_2024-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\USB\4_2024-10-22' --> 'data\processed_data\USB\4_2024-10-22.md'
Error processing data\edgar_documents\USB\4_2024-10-23: File format not allowed: data\edgar_documents\USB\4_2024-10-23
Error processing data\edgar_documents\USB\4_2024-10-24: File format not allowed: data\edgar_documents\USB\4_2024-10-24
Error processing data\edgar_documents\USB\4_2024-10-25: File format not allowed: data\edgar_documents\USB\4_2024-10-25
Error processing data\edgar_documents\USB\4_2024-10-28: File format not allowed: data\edgar_documents\USB\4_2024-10-28
Error processing data\edgar_documents\USB\4_2024-10-29: File format not allowed: data\edgar_documents\USB\4_2024-10-29
Error processing data\edgar_documents\USB\4_2024-10-30: File format not allowed: data\edgar_documents\USB\4_2024-10-30
Error processing data\edgar_documents\USB\4_2024-10-31: File format not allowed: data\edgar_documents\USB\4_2024-10-31
Error processing data\edgar_documents\USB\4_2024-11-05: File format not

2025-11-14 17:50:40,608 - ERROR - Input document 4_2024-11-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:40,609 - INFO - Going to convert document batch...
2025-11-14 17:50:40,623 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,624 - ERROR - Input document 4_2024-12-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\USB\4_2024-11-26: File format not allowed: data\edgar_documents\USB\4_2024-11-26
Error processing data\edgar_documents\USB\4_2024-12-04: File format not allowed: data\edgar_documents\USB\4_2024-12-04
Error processing data\edgar_documents\USB\4_2024-12-05: File format not allowed: data\edgar_documents\USB\4_2024-12-05
Converted 'data\edgar_documents\USB\4_2024-12-17' --> 'data\processed_data\USB\4_2024-12-17.md'
Error processing data\edgar_documents\USB\4_2024-12-18: File format not allowed: data\edgar_documents\USB\4_2024-12-18


2025-11-14 17:50:40,802 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:50:40,837 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:40,838 - ERROR - Input document 4_2025-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:40,839 - INFO - Going to convert document batch...
2025-11-14 17:50:40,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:40,862 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\4_2025-02-05' --> 'data\processed_data\USB\4_2025-02-05.md'
Error processing data\edgar_documents\USB\4_2025-02-06: File format not allowed: data\edgar_documents\USB\4_2025-02-06
Converted 'data\edgar_documents\USB\4_2025-02-07' --> 'data\processed_data\USB\4_2025-02-07.md'
Converted 'data\edgar_documents\USB\4_2025-02-13' --> 'data\processed_data\USB\4_2025-02-13.md'


2025-11-14 17:50:41,045 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,046 - ERROR - Input document 4_2025-02-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:41,047 - INFO - Going to convert document batch...
2025-11-14 17:50:41,060 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,061 - ERROR - Input document 4_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\USB\4_2025-02-14' --> 'data\processed_data\USB\4_2025-02-14.md'
Error processing data\edgar_documents\USB\4_2025-02-18: File format not allowed: data\edgar_documents\USB\4_2025-02-18
Error processing data\edgar_documents\USB\4_2025-02-19: File format not allowed: data\edgar_documents\USB\4_2025-02-19
Error processing data\edgar_documents\USB\4_2025-02-20: File format not allowed: data\edgar_documents\USB\4_2025-02-20
Error processing data\edgar_documents\USB\4_2025-02-21: File format not allowed: data\edgar_documents\USB\4_2025-02-21
Error processing data\edgar_documents\USB\4_2025-02-24: File format not allowed: data\edgar_documents\USB\4_2025-02-24
Error processing data\edgar_documents\USB\4_2025-02-25: File format not allowed: data\edgar_documents\USB\4_2025-02-25
Error processing data\edgar_documents\USB\4_2025-02-26: File format not allowed: data\edgar_documents\USB\4_2025-02-26
Error processing data\edgar_documents\USB\4_2025-02-27: File format not

2025-11-14 17:50:41,254 - INFO - Going to convert document batch...
2025-11-14 17:50:41,255 - INFO - Processing document 4_2025-03-04
2025-11-14 17:50:41,274 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 17:50:41,324 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,325 - ERROR - Input document 4_2025-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:41,327 - INFO - Going to convert document batch...
2025-11-14 17:50:41,345 - IN

Converted 'data\edgar_documents\USB\4_2025-03-04' --> 'data\processed_data\USB\4_2025-03-04.md'
Error processing data\edgar_documents\USB\4_2025-03-10: File format not allowed: data\edgar_documents\USB\4_2025-03-10
Error processing data\edgar_documents\USB\4_2025-03-11: File format not allowed: data\edgar_documents\USB\4_2025-03-11
Error processing data\edgar_documents\USB\4_2025-03-12: File format not allowed: data\edgar_documents\USB\4_2025-03-12
Error processing data\edgar_documents\USB\4_2025-03-13: File format not allowed: data\edgar_documents\USB\4_2025-03-13
Error processing data\edgar_documents\USB\4_2025-03-14: File format not allowed: data\edgar_documents\USB\4_2025-03-14
Error processing data\edgar_documents\USB\4_2025-03-20: File format not allowed: data\edgar_documents\USB\4_2025-03-20
Error processing data\edgar_documents\USB\4_2025-03-21: File format not allowed: data\edgar_documents\USB\4_2025-03-21


2025-11-14 17:50:41,503 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,504 - ERROR - Input document 4_2025-04-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:41,505 - INFO - Going to convert document batch...
2025-11-14 17:50:41,520 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,521 - ERROR - Input document 4_2025-04-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\USB\4_2025-04-21' --> 'data\processed_data\USB\4_2025-04-21.md'
Error processing data\edgar_documents\USB\4_2025-04-23: File format not allowed: data\edgar_documents\USB\4_2025-04-23
Error processing data\edgar_documents\USB\4_2025-04-24: File format not allowed: data\edgar_documents\USB\4_2025-04-24
Error processing data\edgar_documents\USB\4_2025-04-28: File format not allowed: data\edgar_documents\USB\4_2025-04-28
Error processing data\edgar_documents\USB\4_2025-04-29: File format not allowed: data\edgar_documents\USB\4_2025-04-29
Error processing data\edgar_documents\USB\4_2025-05-01: File format not allowed: data\edgar_documents\USB\4_2025-05-01
Error processing data\edgar_documents\USB\4_2025-05-06: File format not allowed: data\edgar_documents\USB\4_2025-05-06
Error processing data\edgar_documents\USB\4_2025-05-08: File format not allowed: data\edgar_documents\USB\4_2025-05-08
Error processing data\edgar_documents\USB\4_2025-05-09: File format not

2025-11-14 17:50:41,675 - ERROR - Input document 4_2025-05-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:41,676 - INFO - Going to convert document batch...
2025-11-14 17:50:41,690 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,690 - ERROR - Input document 4_2025-05-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\USB\4_2025-05-16: File format not allowed: data\edgar_documents\USB\4_2025-05-16
Error processing data\edgar_documents\USB\4_2025-05-20: File format not allowed: data\edgar_documents\USB\4_2025-05-20
Error processing data\edgar_documents\USB\4_2025-05-21: File format not allowed: data\edgar_documents\USB\4_2025-05-21
Error processing data\edgar_documents\USB\4_2025-05-22: File format not allowed: data\edgar_documents\USB\4_2025-05-22
Error processing data\edgar_documents\USB\4_2025-05-28: File format not allowed: data\edgar_documents\USB\4_2025-05-28
Error processing data\edgar_documents\USB\4_2025-05-29: File format not allowed: data\edgar_documents\USB\4_2025-05-29
Error processing data\edgar_documents\USB\4_2025-06-02: File format not allowed: data\edgar_documents\USB\4_2025-06-02
Error processing data\edgar_documents\USB\4_2025-06-03: File format not allowed: data\edgar_documents\USB\4_2025-06-03
Converted 'data\edgar_documents\USB\4_2025-06-10

2025-11-14 17:50:41,863 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,864 - ERROR - Input document 4_2025-06-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:41,865 - INFO - Going to convert document batch...
2025-11-14 17:50:41,878 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:41,879 - ERROR - Input document 4_2025-06-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\USB\4_2025-06-11: File format not allowed: data\edgar_documents\USB\4_2025-06-11
Error processing data\edgar_documents\USB\4_2025-06-12: File format not allowed: data\edgar_documents\USB\4_2025-06-12
Error processing data\edgar_documents\USB\4_2025-06-18: File format not allowed: data\edgar_documents\USB\4_2025-06-18
Error processing data\edgar_documents\USB\4_2025-07-21: File format not allowed: data\edgar_documents\USB\4_2025-07-21
Converted 'data\edgar_documents\USB\4_2025-07-22' --> 'data\processed_data\USB\4_2025-07-22.md'
Error processing data\edgar_documents\USB\4_2025-07-28: File format not allowed: data\edgar_documents\USB\4_2025-07-28


2025-11-14 17:50:42,079 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:42,080 - ERROR - Input document 4_2025-08-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:42,081 - INFO - Going to convert document batch...
2025-11-14 17:50:42,094 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:42,095 - ERROR - Input document 4_2025-08-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\USB\4_2025-07-31' --> 'data\processed_data\USB\4_2025-07-31.md'
Error processing data\edgar_documents\USB\4_2025-08-04: File format not allowed: data\edgar_documents\USB\4_2025-08-04
Error processing data\edgar_documents\USB\4_2025-08-05: File format not allowed: data\edgar_documents\USB\4_2025-08-05
Error processing data\edgar_documents\USB\4_2025-08-06: File format not allowed: data\edgar_documents\USB\4_2025-08-06
Error processing data\edgar_documents\USB\4_2025-08-11: File format not allowed: data\edgar_documents\USB\4_2025-08-11
Error processing data\edgar_documents\USB\4_2025-08-12: File format not allowed: data\edgar_documents\USB\4_2025-08-12
Error processing data\edgar_documents\USB\4_2025-08-13: File format not allowed: data\edgar_documents\USB\4_2025-08-13
Error processing data\edgar_documents\USB\4_2025-08-18: File format not allowed: data\edgar_documents\USB\4_2025-08-18
Error processing data\edgar_documents\USB\4_2025-08-22: File format not

2025-11-14 17:50:42,249 - ERROR - Input document 4_2025-09-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:42,249 - INFO - Going to convert document batch...
2025-11-14 17:50:42,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,270 - INFO - Going to convert document batch...
2025-11-14 17:50:42,271 - INFO - Processing document 4_2025-10-21
2025-11-14 17:50:42,301 - INFO - Finished converting document 4_2025-10-21 in 0.05 sec.
2025-11-14 17:50:42,372 - INFO - detec

Error processing data\edgar_documents\USB\4_2025-09-10: File format not allowed: data\edgar_documents\USB\4_2025-09-10
Converted 'data\edgar_documents\USB\4_2025-10-21' --> 'data\processed_data\USB\4_2025-10-21.md'
Converted 'data\edgar_documents\USB\4_2025-10-22' --> 'data\processed_data\USB\4_2025-10-22.md'


2025-11-14 17:50:42,464 - INFO - Going to convert document batch...
2025-11-14 17:50:42,465 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:50:42,485 - INFO - Finished converting document 8-K_2023-01-24 in 0.05 sec.
2025-11-14 17:50:42,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,521 - INFO - Going to convert document batch...
2025-11-14 17:50:42,522 - INFO - Processing document 8-K_2023-01-25
2025-11-14 17:50:42,539 - INFO - Finished converting document 8-K_2023-01-25 in 0.03 sec.
2025-11-14 17:50:42,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,577 - INFO - Going to convert document batch...
2025-11-14 17:50:42,577 - INFO - Processing document 8-K_2023-02-16
2025-11-14 17:50:42,597 - INFO - Finished converting document 8-K_2023-02-16 in 0.05 sec.
2025-11-14 17:50:42,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,634 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2023-01-24' --> 'data\processed_data\USB\8-K_2023-01-24.md'
Converted 'data\edgar_documents\USB\8-K_2023-01-25' --> 'data\processed_data\USB\8-K_2023-01-25.md'
Converted 'data\edgar_documents\USB\8-K_2023-02-16' --> 'data\processed_data\USB\8-K_2023-02-16.md'
Converted 'data\edgar_documents\USB\8-K_2023-03-08' --> 'data\processed_data\USB\8-K_2023-03-08.md'


2025-11-14 17:50:42,692 - INFO - Processing document 8-K_2023-04-12
2025-11-14 17:50:42,707 - INFO - Finished converting document 8-K_2023-04-12 in 0.05 sec.
2025-11-14 17:50:42,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,744 - INFO - Going to convert document batch...
2025-11-14 17:50:42,745 - INFO - Processing document 8-K_2023-04-19
2025-11-14 17:50:42,763 - INFO - Finished converting document 8-K_2023-04-19 in 0.05 sec.
2025-11-14 17:50:42,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,812 - INFO - Going to convert document batch...
2025-11-14 17:50:42,813 - INFO - Processing document 8-K_2023-04-20
2025-11-14 17:50:42,847 - INFO - Finished converting document 8-K_2023-04-20 in 0.08 sec.
2025-11-14 17:50:42,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,892 - INFO - Going to convert document batch...
2025-11-14 17:50:42,893 - INFO - Processing document 8-K_2023-04-21
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2023-04-12' --> 'data\processed_data\USB\8-K_2023-04-12.md'
Converted 'data\edgar_documents\USB\8-K_2023-04-19' --> 'data\processed_data\USB\8-K_2023-04-19.md'
Converted 'data\edgar_documents\USB\8-K_2023-04-20' --> 'data\processed_data\USB\8-K_2023-04-20.md'


2025-11-14 17:50:42,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:42,966 - INFO - Going to convert document batch...
2025-11-14 17:50:42,966 - INFO - Processing document 8-K_2023-05-16
2025-11-14 17:50:42,985 - INFO - Finished converting document 8-K_2023-05-16 in 0.05 sec.
2025-11-14 17:50:43,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,041 - INFO - Going to convert document batch...
2025-11-14 17:50:43,042 - INFO - Processing document 8-K_2023-07-19
2025-11-14 17:50:43,067 - INFO - Finished converting document 8-K_2023-07-19 in 0.06 sec.
2025-11-14 17:50:43,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,109 - INFO - Going to convert document batch...
2025-11-14 17:50:43,109 - INFO - Processing document 8-K_2023-08-03


Converted 'data\edgar_documents\USB\8-K_2023-04-21' --> 'data\processed_data\USB\8-K_2023-04-21.md'
Converted 'data\edgar_documents\USB\8-K_2023-05-16' --> 'data\processed_data\USB\8-K_2023-05-16.md'
Converted 'data\edgar_documents\USB\8-K_2023-07-19' --> 'data\processed_data\USB\8-K_2023-07-19.md'


2025-11-14 17:50:43,130 - INFO - Finished converting document 8-K_2023-08-03 in 0.05 sec.
2025-11-14 17:50:43,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,168 - INFO - Going to convert document batch...
2025-11-14 17:50:43,169 - INFO - Processing document 8-K_2023-08-23
2025-11-14 17:50:43,185 - INFO - Finished converting document 8-K_2023-08-23 in 0.05 sec.
2025-11-14 17:50:43,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,221 - INFO - Going to convert document batch...
2025-11-14 17:50:43,222 - INFO - Processing document 8-K_2023-09-13
2025-11-14 17:50:43,242 - INFO - Finished converting document 8-K_2023-09-13 in 0.05 sec.
2025-11-14 17:50:43,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,276 - INFO - Going to convert document batch...
2025-11-14 17:50:43,277 - INFO - Processing document 8-K_2023-10-17
2025-11-14 17:50:43,290 - INFO - Finished converting document 8-K_2023-10-17 in 0.

Converted 'data\edgar_documents\USB\8-K_2023-08-03' --> 'data\processed_data\USB\8-K_2023-08-03.md'
Converted 'data\edgar_documents\USB\8-K_2023-08-23' --> 'data\processed_data\USB\8-K_2023-08-23.md'
Converted 'data\edgar_documents\USB\8-K_2023-09-13' --> 'data\processed_data\USB\8-K_2023-09-13.md'
Converted 'data\edgar_documents\USB\8-K_2023-10-17' --> 'data\processed_data\USB\8-K_2023-10-17.md'


2025-11-14 17:50:43,921 - INFO - Going to convert document batch...
2025-11-14 17:50:43,922 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:50:43,934 - INFO - Finished converting document 8-K_2023-10-18 in 0.64 sec.
2025-11-14 17:50:43,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:43,969 - INFO - Going to convert document batch...
2025-11-14 17:50:43,970 - INFO - Processing document 8-K_2023-10-19
2025-11-14 17:50:43,992 - INFO - Finished converting document 8-K_2023-10-19 in 0.05 sec.
2025-11-14 17:50:44,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,034 - INFO - Going to convert document batch...
2025-11-14 17:50:44,034 - INFO - Processing document 8-K_2023-11-01
2025-11-14 17:50:44,051 - INFO - Finished converting document 8-K_2023-11-01 in 0.05 sec.
2025-11-14 17:50:44,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,082 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2023-10-18' --> 'data\processed_data\USB\8-K_2023-10-18.md'
Converted 'data\edgar_documents\USB\8-K_2023-10-19' --> 'data\processed_data\USB\8-K_2023-10-19.md'
Converted 'data\edgar_documents\USB\8-K_2023-11-01' --> 'data\processed_data\USB\8-K_2023-11-01.md'
Converted 'data\edgar_documents\USB\8-K_2023-12-06' --> 'data\processed_data\USB\8-K_2023-12-06.md'


2025-11-14 17:50:44,132 - INFO - Going to convert document batch...
2025-11-14 17:50:44,134 - INFO - Processing document 8-K_2024-01-17
2025-11-14 17:50:44,150 - INFO - Finished converting document 8-K_2024-01-17 in 0.03 sec.
2025-11-14 17:50:44,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,202 - INFO - Going to convert document batch...
2025-11-14 17:50:44,204 - INFO - Processing document 8-K_2024-02-21
2025-11-14 17:50:44,226 - INFO - Finished converting document 8-K_2024-02-21 in 0.06 sec.
2025-11-14 17:50:44,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,265 - INFO - Going to convert document batch...
2025-11-14 17:50:44,266 - INFO - Processing document 8-K_2024-03-05
2025-11-14 17:50:44,282 - INFO - Finished converting document 8-K_2024-03-05 in 0.05 sec.
2025-11-14 17:50:44,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,314 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2024-01-17' --> 'data\processed_data\USB\8-K_2024-01-17.md'
Converted 'data\edgar_documents\USB\8-K_2024-02-21' --> 'data\processed_data\USB\8-K_2024-02-21.md'
Converted 'data\edgar_documents\USB\8-K_2024-03-05' --> 'data\processed_data\USB\8-K_2024-03-05.md'
Converted 'data\edgar_documents\USB\8-K_2024-04-17' --> 'data\processed_data\USB\8-K_2024-04-17.md'


2025-11-14 17:50:44,383 - INFO - Going to convert document batch...
2025-11-14 17:50:44,383 - INFO - Processing document 8-K_2024-04-18
2025-11-14 17:50:44,422 - INFO - Finished converting document 8-K_2024-04-18 in 0.08 sec.
2025-11-14 17:50:44,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,466 - INFO - Going to convert document batch...
2025-11-14 17:50:44,467 - INFO - Processing document 8-K_2024-05-03
2025-11-14 17:50:44,485 - INFO - Finished converting document 8-K_2024-05-03 in 0.05 sec.
2025-11-14 17:50:44,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,535 - INFO - Going to convert document batch...
2025-11-14 17:50:44,536 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:50:44,563 - INFO - Finished converting document 8-K_2024-05-06 in 0.06 sec.
2025-11-14 17:50:44,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,633 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\USB\8-K_2024-04-18' --> 'data\processed_data\USB\8-K_2024-04-18.md'
Converted 'data\edgar_documents\USB\8-K_2024-05-03' --> 'data\processed_data\USB\8-K_2024-05-03.md'
Converted 'data\edgar_documents\USB\8-K_2024-05-06' --> 'data\processed_data\USB\8-K_2024-05-06.md'


2025-11-14 17:50:44,634 - INFO - Processing document 8-K_2024-05-31
2025-11-14 17:50:44,654 - INFO - Finished converting document 8-K_2024-05-31 in 0.08 sec.
2025-11-14 17:50:44,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,692 - INFO - Going to convert document batch...
2025-11-14 17:50:44,693 - INFO - Processing document 8-K_2024-06-27
2025-11-14 17:50:44,714 - INFO - Finished converting document 8-K_2024-06-27 in 0.06 sec.
2025-11-14 17:50:44,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,749 - INFO - Going to convert document batch...
2025-11-14 17:50:44,750 - INFO - Processing document 8-K_2024-07-01
2025-11-14 17:50:44,765 - INFO - Finished converting document 8-K_2024-07-01 in 0.05 sec.
2025-11-14 17:50:44,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,798 - INFO - Going to convert document batch...
2025-11-14 17:50:44,799 - INFO - Processing document 8-K_2024-07-16
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2024-05-31' --> 'data\processed_data\USB\8-K_2024-05-31.md'
Converted 'data\edgar_documents\USB\8-K_2024-06-27' --> 'data\processed_data\USB\8-K_2024-06-27.md'
Converted 'data\edgar_documents\USB\8-K_2024-07-01' --> 'data\processed_data\USB\8-K_2024-07-01.md'
Converted 'data\edgar_documents\USB\8-K_2024-07-16' --> 'data\processed_data\USB\8-K_2024-07-16.md'


2025-11-14 17:50:44,847 - INFO - Going to convert document batch...
2025-11-14 17:50:44,848 - INFO - Processing document 8-K_2024-07-17
2025-11-14 17:50:44,867 - INFO - Finished converting document 8-K_2024-07-17 in 0.03 sec.
2025-11-14 17:50:44,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,902 - INFO - Going to convert document batch...
2025-11-14 17:50:44,903 - INFO - Processing document 8-K_2024-08-21
2025-11-14 17:50:44,921 - INFO - Finished converting document 8-K_2024-08-21 in 0.05 sec.
2025-11-14 17:50:44,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:44,956 - INFO - Going to convert document batch...
2025-11-14 17:50:44,957 - INFO - Processing document 8-K_2024-09-12
2025-11-14 17:50:44,973 - INFO - Finished converting document 8-K_2024-09-12 in 0.05 sec.
2025-11-14 17:50:44,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,008 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2024-07-17' --> 'data\processed_data\USB\8-K_2024-07-17.md'
Converted 'data\edgar_documents\USB\8-K_2024-08-21' --> 'data\processed_data\USB\8-K_2024-08-21.md'
Converted 'data\edgar_documents\USB\8-K_2024-09-12' --> 'data\processed_data\USB\8-K_2024-09-12.md'
Converted 'data\edgar_documents\USB\8-K_2024-09-20' --> 'data\processed_data\USB\8-K_2024-09-20.md'


2025-11-14 17:50:45,065 - INFO - Processing document 8-K_2024-10-15
2025-11-14 17:50:45,084 - INFO - Finished converting document 8-K_2024-10-15 in 0.05 sec.
2025-11-14 17:50:45,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,124 - INFO - Going to convert document batch...
2025-11-14 17:50:45,125 - INFO - Processing document 8-K_2024-10-16
2025-11-14 17:50:45,144 - INFO - Finished converting document 8-K_2024-10-16 in 0.05 sec.
2025-11-14 17:50:45,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,186 - INFO - Going to convert document batch...
2025-11-14 17:50:45,187 - INFO - Processing document 8-K_2024-11-07
2025-11-14 17:50:45,205 - INFO - Finished converting document 8-K_2024-11-07 in 0.05 sec.
2025-11-14 17:50:45,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,238 - INFO - Going to convert document batch...
2025-11-14 17:50:45,239 - INFO - Processing document 8-K_2025-01-16
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2024-10-15' --> 'data\processed_data\USB\8-K_2024-10-15.md'
Converted 'data\edgar_documents\USB\8-K_2024-10-16' --> 'data\processed_data\USB\8-K_2024-10-16.md'
Converted 'data\edgar_documents\USB\8-K_2024-11-07' --> 'data\processed_data\USB\8-K_2024-11-07.md'
Converted 'data\edgar_documents\USB\8-K_2025-01-16' --> 'data\processed_data\USB\8-K_2025-01-16.md'


2025-11-14 17:50:45,295 - INFO - Going to convert document batch...
2025-11-14 17:50:45,296 - INFO - Processing document 8-K_2025-01-28
2025-11-14 17:50:45,316 - INFO - Finished converting document 8-K_2025-01-28 in 0.05 sec.
2025-11-14 17:50:45,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,368 - INFO - Going to convert document batch...
2025-11-14 17:50:45,369 - INFO - Processing document 8-K_2025-01-31
2025-11-14 17:50:45,396 - INFO - Finished converting document 8-K_2025-01-31 in 0.06 sec.
2025-11-14 17:50:45,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,467 - INFO - Going to convert document batch...
2025-11-14 17:50:45,468 - INFO - Processing document 8-K_2025-03-25
2025-11-14 17:50:45,494 - INFO - Finished converting document 8-K_2025-03-25 in 0.06 sec.
2025-11-14 17:50:45,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\USB\8-K_2025-01-28' --> 'data\processed_data\USB\8-K_2025-01-28.md'
Converted 'data\edgar_documents\USB\8-K_2025-01-31' --> 'data\processed_data\USB\8-K_2025-01-31.md'
Converted 'data\edgar_documents\USB\8-K_2025-03-25' --> 'data\processed_data\USB\8-K_2025-03-25.md'


2025-11-14 17:50:45,537 - INFO - Going to convert document batch...
2025-11-14 17:50:45,537 - INFO - Processing document 8-K_2025-03-31
2025-11-14 17:50:45,554 - INFO - Finished converting document 8-K_2025-03-31 in 0.05 sec.
2025-11-14 17:50:45,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,594 - INFO - Going to convert document batch...
2025-11-14 17:50:45,594 - INFO - Processing document 8-K_2025-04-16
2025-11-14 17:50:45,614 - INFO - Finished converting document 8-K_2025-04-16 in 0.05 sec.
2025-11-14 17:50:45,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,657 - INFO - Going to convert document batch...
2025-11-14 17:50:45,658 - INFO - Processing document 8-K_2025-04-17
2025-11-14 17:50:45,691 - INFO - Finished converting document 8-K_2025-04-17 in 0.06 sec.
2025-11-14 17:50:45,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,730 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\USB\8-K_2025-03-31' --> 'data\processed_data\USB\8-K_2025-03-31.md'
Converted 'data\edgar_documents\USB\8-K_2025-04-16' --> 'data\processed_data\USB\8-K_2025-04-16.md'
Converted 'data\edgar_documents\USB\8-K_2025-04-17' --> 'data\processed_data\USB\8-K_2025-04-17.md'


2025-11-14 17:50:45,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,779 - INFO - Going to convert document batch...
2025-11-14 17:50:45,780 - INFO - Processing document 8-K_2025-07-17
2025-11-14 17:50:45,799 - INFO - Finished converting document 8-K_2025-07-17 in 0.05 sec.
2025-11-14 17:50:45,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,838 - INFO - Going to convert document batch...
2025-11-14 17:50:45,838 - INFO - Processing document 8-K_2025-08-14
2025-11-14 17:50:45,861 - INFO - Finished converting document 8-K_2025-08-14 in 0.05 sec.
2025-11-14 17:50:45,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,895 - INFO - Going to convert document batch...
2025-11-14 17:50:45,895 - INFO - Processing document 8-K_2025-10-16
2025-11-14 17:50:45,912 - INFO - Finished converting document 8-K_2025-10-16 in 0.03 sec.


Converted 'data\edgar_documents\USB\8-K_2025-07-02' --> 'data\processed_data\USB\8-K_2025-07-02.md'
Converted 'data\edgar_documents\USB\8-K_2025-07-17' --> 'data\processed_data\USB\8-K_2025-07-17.md'
Converted 'data\edgar_documents\USB\8-K_2025-08-14' --> 'data\processed_data\USB\8-K_2025-08-14.md'
Converted 'data\edgar_documents\USB\8-K_2025-10-16' --> 'data\processed_data\USB\8-K_2025-10-16.md'


2025-11-14 17:50:45,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:45,971 - INFO - Going to convert document batch...
2025-11-14 17:50:45,972 - INFO - Processing document 8-K_2025-11-06
2025-11-14 17:50:45,988 - INFO - Finished converting document 8-K_2025-11-06 in 0.06 sec.
2025-11-14 17:50:46,042 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:46,043 - ERROR - Input document DEF-14A_2023-03-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\USB\8-K_2025-11-06' --> 'data\processed_data\USB\8-K_2025-11-06.md'
Error processing data\edgar_documents\USB\DEF-14A_2023-03-07: File format not allowed: data\edgar_documents\USB\DEF-14A_2023-03-07


2025-11-14 17:50:47,137 - INFO - Going to convert document batch...
2025-11-14 17:50:47,138 - INFO - Processing document DEF-14A_2024-03-05
2025-11-14 17:50:55,280 - INFO - Finished converting document DEF-14A_2024-03-05 in 9.23 sec.
2025-11-14 17:50:56,178 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:50:56,179 - ERROR - Input document DEF-14A_2025-03-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:50:56,182 - INFO - Going to 

Converted 'data\edgar_documents\USB\DEF-14A_2024-03-05' --> 'data\processed_data\USB\DEF-14A_2024-03-05.md'
Error processing data\edgar_documents\USB\DEF-14A_2025-03-05: File format not allowed: data\edgar_documents\USB\DEF-14A_2025-03-05
Processed 99 new files. Errors: 85
Found 133 files to process in data\edgar_documents\V


2025-11-14 17:50:56,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:50:57,132 - INFO - Going to convert document batch...
2025-11-14 17:50:57,133 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:50:57,133 - INFO - Processing document 10-K_2023-11-15
2025-11-14 17:50:58,751 - INFO - Finished converting document 10-K_2023-11-15 in 2.55 sec.
2025-11-14 17:50:59,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-K_2023-11-15' --> 'data\processed_data\V\10-K_2023-11-15.md'


2025-11-14 17:51:00,344 - INFO - Going to convert document batch...
2025-11-14 17:51:00,345 - INFO - Processing document 10-K_2024-11-13
2025-11-14 17:51:01,832 - INFO - Finished converting document 10-K_2024-11-13 in 2.39 sec.
2025-11-14 17:51:02,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-K_2024-11-13' --> 'data\processed_data\V\10-K_2024-11-13.md'


2025-11-14 17:51:03,180 - INFO - Going to convert document batch...
2025-11-14 17:51:03,181 - INFO - Processing document 10-K_2025-11-06
2025-11-14 17:51:04,988 - INFO - Finished converting document 10-K_2025-11-06 in 2.44 sec.
2025-11-14 17:51:05,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-K_2025-11-06' --> 'data\processed_data\V\10-K_2025-11-06.md'


2025-11-14 17:51:06,063 - INFO - Going to convert document batch...
2025-11-14 17:51:06,064 - INFO - Processing document 10-Q_2023-01-27
2025-11-14 17:51:06,769 - INFO - Finished converting document 10-Q_2023-01-27 in 1.11 sec.
2025-11-14 17:51:07,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2023-01-27' --> 'data\processed_data\V\10-Q_2023-01-27.md'


2025-11-14 17:51:08,044 - INFO - Going to convert document batch...
2025-11-14 17:51:08,044 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:51:08,855 - INFO - Finished converting document 10-Q_2023-04-27 in 1.67 sec.
2025-11-14 17:51:09,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2023-04-27' --> 'data\processed_data\V\10-Q_2023-04-27.md'


2025-11-14 17:51:09,795 - INFO - Going to convert document batch...
2025-11-14 17:51:09,795 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 17:51:10,654 - INFO - Finished converting document 10-Q_2023-07-26 in 1.30 sec.
2025-11-14 17:51:11,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2023-07-26' --> 'data\processed_data\V\10-Q_2023-07-26.md'


2025-11-14 17:51:11,880 - INFO - Going to convert document batch...
2025-11-14 17:51:11,881 - INFO - Processing document 10-Q_2024-01-26
2025-11-14 17:51:12,568 - INFO - Finished converting document 10-Q_2024-01-26 in 1.42 sec.
2025-11-14 17:51:13,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2024-01-26' --> 'data\processed_data\V\10-Q_2024-01-26.md'


2025-11-14 17:51:13,443 - INFO - Going to convert document batch...
2025-11-14 17:51:13,444 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 17:51:14,622 - INFO - Finished converting document 10-Q_2024-04-24 in 1.64 sec.
2025-11-14 17:51:15,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2024-04-24' --> 'data\processed_data\V\10-Q_2024-04-24.md'


2025-11-14 17:51:15,649 - INFO - Going to convert document batch...
2025-11-14 17:51:15,649 - INFO - Processing document 10-Q_2024-07-24
2025-11-14 17:51:16,524 - INFO - Finished converting document 10-Q_2024-07-24 in 1.33 sec.
2025-11-14 17:51:17,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2024-07-24' --> 'data\processed_data\V\10-Q_2024-07-24.md'


2025-11-14 17:51:17,715 - INFO - Going to convert document batch...
2025-11-14 17:51:17,716 - INFO - Processing document 10-Q_2025-01-31
2025-11-14 17:51:18,433 - INFO - Finished converting document 10-Q_2025-01-31 in 1.41 sec.
2025-11-14 17:51:18,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2025-01-31' --> 'data\processed_data\V\10-Q_2025-01-31.md'


2025-11-14 17:51:19,272 - INFO - Going to convert document batch...
2025-11-14 17:51:19,273 - INFO - Processing document 10-Q_2025-04-30
2025-11-14 17:51:20,150 - INFO - Finished converting document 10-Q_2025-04-30 in 1.30 sec.
2025-11-14 17:51:20,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\10-Q_2025-04-30' --> 'data\processed_data\V\10-Q_2025-04-30.md'


2025-11-14 17:51:21,390 - INFO - Going to convert document batch...
2025-11-14 17:51:21,391 - INFO - Processing document 10-Q_2025-07-30
2025-11-14 17:51:22,263 - INFO - Finished converting document 10-Q_2025-07-30 in 1.61 sec.
2025-11-14 17:51:22,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:22,817 - INFO - Going to convert document batch...
2025-11-14 17:51:22,817 - INFO - Processing document 4_2023-01-10
2025-11-14 17:51:22,839 - INFO - Finished converting document 4_2023-01-10 in 0.03 sec.
2025-11-14 17:51:22,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:22,898 - INFO - Going to convert document batch...
2025-11-14 17:51:22,899 - INFO - Processing document 4_2023-01-18
2025-11-14 17:51:22,919 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.
2025-11-14 17:51:22,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:22,961 - INFO - Going to convert document batch...
2025-11-14 17:51:22,

Converted 'data\edgar_documents\V\10-Q_2025-07-30' --> 'data\processed_data\V\10-Q_2025-07-30.md'
Converted 'data\edgar_documents\V\4_2023-01-10' --> 'data\processed_data\V\4_2023-01-10.md'
Converted 'data\edgar_documents\V\4_2023-01-18' --> 'data\processed_data\V\4_2023-01-18.md'


2025-11-14 17:51:23,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,018 - INFO - Going to convert document batch...
2025-11-14 17:51:23,018 - INFO - Processing document 4_2023-02-03
2025-11-14 17:51:23,044 - INFO - Finished converting document 4_2023-02-03 in 0.05 sec.
2025-11-14 17:51:23,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,110 - INFO - Going to convert document batch...
2025-11-14 17:51:23,111 - INFO - Processing document 4_2023-02-17
2025-11-14 17:51:23,148 - INFO - Finished converting document 4_2023-02-17 in 0.08 sec.


Converted 'data\edgar_documents\V\4_2023-01-26' --> 'data\processed_data\V\4_2023-01-26.md'
Converted 'data\edgar_documents\V\4_2023-02-03' --> 'data\processed_data\V\4_2023-02-03.md'
Converted 'data\edgar_documents\V\4_2023-02-17' --> 'data\processed_data\V\4_2023-02-17.md'


2025-11-14 17:51:23,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,224 - INFO - Going to convert document batch...
2025-11-14 17:51:23,225 - INFO - Processing document 4_2023-02-27
2025-11-14 17:51:23,257 - INFO - Finished converting document 4_2023-02-27 in 0.06 sec.
2025-11-14 17:51:23,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,310 - INFO - Going to convert document batch...
2025-11-14 17:51:23,311 - INFO - Processing document 4_2023-03-08
2025-11-14 17:51:23,337 - INFO - Finished converting document 4_2023-03-08 in 0.05 sec.
2025-11-14 17:51:23,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,376 - INFO - Going to convert document batch...
2025-11-14 17:51:23,376 - INFO - Processing document 4_2023-05-01
2025-11-14 17:51:23,396 - INFO - Finished converting document 4_2023-05-01 in 0.03 sec.
2025-11-14 17:51:23,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\V\4_2023-02-27' --> 'data\processed_data\V\4_2023-02-27.md'
Converted 'data\edgar_documents\V\4_2023-03-08' --> 'data\processed_data\V\4_2023-03-08.md'
Converted 'data\edgar_documents\V\4_2023-05-01' --> 'data\processed_data\V\4_2023-05-01.md'
Converted 'data\edgar_documents\V\4_2023-05-02' --> 'data\processed_data\V\4_2023-05-02.md'


2025-11-14 17:51:23,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,520 - INFO - Going to convert document batch...
2025-11-14 17:51:23,521 - INFO - Processing document 4_2023-05-16
2025-11-14 17:51:23,540 - INFO - Finished converting document 4_2023-05-16 in 0.05 sec.
2025-11-14 17:51:23,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,586 - INFO - Going to convert document batch...
2025-11-14 17:51:23,587 - INFO - Processing document 4_2023-07-07
2025-11-14 17:51:23,624 - INFO - Finished converting document 4_2023-07-07 in 0.06 sec.
2025-11-14 17:51:23,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,698 - INFO - Going to convert document batch...
2025-11-14 17:51:23,699 - INFO - Processing document 4_2023-07-13
2025-11-14 17:51:23,722 - INFO - Finished converting document 4_2023-07-13 in 0.06 sec.
2025-11-14 17:51:23,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\4_2023-05-16' --> 'data\processed_data\V\4_2023-05-16.md'
Converted 'data\edgar_documents\V\4_2023-07-07' --> 'data\processed_data\V\4_2023-07-07.md'
Converted 'data\edgar_documents\V\4_2023-07-13' --> 'data\processed_data\V\4_2023-07-13.md'


2025-11-14 17:51:23,793 - INFO - Going to convert document batch...
2025-11-14 17:51:23,794 - INFO - Processing document 4_2023-08-02
2025-11-14 17:51:23,815 - INFO - Finished converting document 4_2023-08-02 in 0.06 sec.
2025-11-14 17:51:23,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,858 - INFO - Going to convert document batch...
2025-11-14 17:51:23,859 - INFO - Processing document 4_2023-08-16
2025-11-14 17:51:23,883 - INFO - Finished converting document 4_2023-08-16 in 0.05 sec.
2025-11-14 17:51:23,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:23,937 - INFO - Going to convert document batch...
2025-11-14 17:51:23,938 - INFO - Processing document 4_2023-09-01
2025-11-14 17:51:23,960 - INFO - Finished converting document 4_2023-09-01 in 0.05 sec.
2025-11-14 17:51:23,993 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:51:23,994 - ERROR - Input document 4_2023-09-13 with format None does 

Converted 'data\edgar_documents\V\4_2023-08-02' --> 'data\processed_data\V\4_2023-08-02.md'
Converted 'data\edgar_documents\V\4_2023-08-16' --> 'data\processed_data\V\4_2023-08-16.md'
Converted 'data\edgar_documents\V\4_2023-09-01' --> 'data\processed_data\V\4_2023-09-01.md'
Error processing data\edgar_documents\V\4_2023-09-13: File format not allowed: data\edgar_documents\V\4_2023-09-13
Error processing data\edgar_documents\V\4_2023-09-14: File format not allowed: data\edgar_documents\V\4_2023-09-14


2025-11-14 17:51:24,030 - INFO - Going to convert document batch...
2025-11-14 17:51:24,031 - INFO - Processing document 4_2023-09-15
2025-11-14 17:51:24,053 - INFO - Finished converting document 4_2023-09-15 in 0.05 sec.
2025-11-14 17:51:24,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,104 - INFO - Going to convert document batch...
2025-11-14 17:51:24,105 - INFO - Processing document 4_2023-10-17
2025-11-14 17:51:24,145 - INFO - Finished converting document 4_2023-10-17 in 0.06 sec.
2025-11-14 17:51:24,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,196 - INFO - Going to convert document batch...
2025-11-14 17:51:24,197 - INFO - Processing document 4_2023-11-02
2025-11-14 17:51:24,217 - INFO - Finished converting document 4_2023-11-02 in 0.05 sec.
2025-11-14 17:51:24,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,258 - INFO - Going to convert document batch...
2025-11-14 17:51:24,259 - 

Converted 'data\edgar_documents\V\4_2023-09-15' --> 'data\processed_data\V\4_2023-09-15.md'
Converted 'data\edgar_documents\V\4_2023-10-17' --> 'data\processed_data\V\4_2023-10-17.md'
Converted 'data\edgar_documents\V\4_2023-11-02' --> 'data\processed_data\V\4_2023-11-02.md'


2025-11-14 17:51:24,282 - INFO - Finished converting document 4_2023-11-03 in 0.05 sec.
2025-11-14 17:51:24,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,326 - INFO - Going to convert document batch...
2025-11-14 17:51:24,327 - INFO - Processing document 4_2023-11-20
2025-11-14 17:51:24,349 - INFO - Finished converting document 4_2023-11-20 in 0.05 sec.
2025-11-14 17:51:24,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,402 - INFO - Going to convert document batch...
2025-11-14 17:51:24,403 - INFO - Processing document 4_2023-11-21
2025-11-14 17:51:24,437 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 17:51:24,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,479 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\4_2023-11-03' --> 'data\processed_data\V\4_2023-11-03.md'
Converted 'data\edgar_documents\V\4_2023-11-20' --> 'data\processed_data\V\4_2023-11-20.md'
Converted 'data\edgar_documents\V\4_2023-11-21' --> 'data\processed_data\V\4_2023-11-21.md'


2025-11-14 17:51:24,480 - INFO - Processing document 4_2023-11-22
2025-11-14 17:51:24,497 - INFO - Finished converting document 4_2023-11-22 in 0.03 sec.
2025-11-14 17:51:24,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,541 - INFO - Going to convert document batch...
2025-11-14 17:51:24,541 - INFO - Processing document 4_2023-12-04
2025-11-14 17:51:24,568 - INFO - Finished converting document 4_2023-12-04 in 0.05 sec.
2025-11-14 17:51:24,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,610 - INFO - Going to convert document batch...
2025-11-14 17:51:24,610 - INFO - Processing document 4_2023-12-06
2025-11-14 17:51:24,626 - INFO - Finished converting document 4_2023-12-06 in 0.03 sec.
2025-11-14 17:51:24,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,667 - INFO - Going to convert document batch...
2025-11-14 17:51:24,668 - INFO - Processing document 4_2023-12-14
2025-11-14 17:51:24,692 - IN

Converted 'data\edgar_documents\V\4_2023-11-22' --> 'data\processed_data\V\4_2023-11-22.md'
Converted 'data\edgar_documents\V\4_2023-12-04' --> 'data\processed_data\V\4_2023-12-04.md'
Converted 'data\edgar_documents\V\4_2023-12-06' --> 'data\processed_data\V\4_2023-12-06.md'
Converted 'data\edgar_documents\V\4_2023-12-14' --> 'data\processed_data\V\4_2023-12-14.md'


2025-11-14 17:51:24,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,752 - INFO - Going to convert document batch...
2025-11-14 17:51:24,753 - INFO - Processing document 4_2024-01-03
2025-11-14 17:51:24,775 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 17:51:24,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,821 - INFO - Going to convert document batch...
2025-11-14 17:51:24,822 - INFO - Processing document 4_2024-01-16
2025-11-14 17:51:24,844 - INFO - Finished converting document 4_2024-01-16 in 0.05 sec.
2025-11-14 17:51:24,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:24,886 - INFO - Going to convert document batch...
2025-11-14 17:51:24,887 - INFO - Processing document 4_2024-01-22
2025-11-14 17:51:24,908 - INFO - Finished converting document 4_2024-01-22 in 0.05 sec.
2025-11-14 17:51:24,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\V\4_2024-01-03' --> 'data\processed_data\V\4_2024-01-03.md'
Converted 'data\edgar_documents\V\4_2024-01-16' --> 'data\processed_data\V\4_2024-01-16.md'
Converted 'data\edgar_documents\V\4_2024-01-22' --> 'data\processed_data\V\4_2024-01-22.md'


2025-11-14 17:51:24,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:25,004 - INFO - Going to convert document batch...
2025-11-14 17:51:25,005 - INFO - Processing document 4_2024-02-05
2025-11-14 17:51:25,029 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 17:51:25,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:25,070 - INFO - Going to convert document batch...
2025-11-14 17:51:25,071 - INFO - Processing document 4_2024-02-08
2025-11-14 17:51:25,089 - INFO - Finished converting document 4_2024-02-08 in 0.05 sec.
2025-11-14 17:51:25,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:25,127 - INFO - Going to convert document batch...
2025-11-14 17:51:25,130 - INFO - Processing document 4_2024-02-16
2025-11-14 17:51:25,150 - INFO - Finished converting document 4_2024-02-16 in 0.03 sec.


Converted 'data\edgar_documents\V\4_2024-01-24' --> 'data\processed_data\V\4_2024-01-24.md'
Converted 'data\edgar_documents\V\4_2024-02-05' --> 'data\processed_data\V\4_2024-02-05.md'
Converted 'data\edgar_documents\V\4_2024-02-08' --> 'data\processed_data\V\4_2024-02-08.md'


2025-11-14 17:51:25,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:25,191 - INFO - Going to convert document batch...
2025-11-14 17:51:25,192 - INFO - Processing document 4_2024-03-04
2025-11-14 17:51:25,224 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.
2025-11-14 17:51:25,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:25,295 - INFO - Going to convert document batch...
2025-11-14 17:51:25,296 - INFO - Processing document 4_2024-04-01
2025-11-14 17:51:25,319 - INFO - Finished converting document 4_2024-04-01 in 0.05 sec.


Converted 'data\edgar_documents\V\4_2024-02-16' --> 'data\processed_data\V\4_2024-02-16.md'
Converted 'data\edgar_documents\V\4_2024-03-04' --> 'data\processed_data\V\4_2024-03-04.md'
Converted 'data\edgar_documents\V\4_2024-04-01' --> 'data\processed_data\V\4_2024-04-01.md'


2025-11-14 17:51:25,388 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:51:25,389 - ERROR - Input document 4_2024-04-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:51:25,391 - INFO - Going to convert document batch...
2025-11-14 17:51:25,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\V\4_2024-04-08: File format not allowed: data\edgar_documents\V\4_2024-04-08


2025-11-14 17:51:25,740 - INFO - Going to convert document batch...
2025-11-14 17:51:25,740 - INFO - Processing document 4_2024-04-26
2025-11-14 17:51:25,757 - INFO - Finished converting document 4_2024-04-26 in 0.36 sec.
2025-11-14 17:51:25,790 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:51:25,791 - ERROR - Input document 4_2024-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:51:25,792 - INFO - Going to convert document batch...
2025-11-14 17:51:25,804 - IN

Converted 'data\edgar_documents\V\4_2024-04-26' --> 'data\processed_data\V\4_2024-04-26.md'
Error processing data\edgar_documents\V\4_2024-05-06: File format not allowed: data\edgar_documents\V\4_2024-05-06
Converted 'data\edgar_documents\V\4_2024-05-15' --> 'data\processed_data\V\4_2024-05-15.md'
Converted 'data\edgar_documents\V\4_2024-08-16' --> 'data\processed_data\V\4_2024-08-16.md'
Converted 'data\edgar_documents\V\4_2024-08-20' --> 'data\processed_data\V\4_2024-08-20.md'


2025-11-14 17:51:25,994 - INFO - Going to convert document batch...
2025-11-14 17:51:25,995 - INFO - Processing document 4_2024-08-30
2025-11-14 17:51:26,018 - INFO - Finished converting document 4_2024-08-30 in 0.05 sec.
2025-11-14 17:51:26,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,060 - INFO - Going to convert document batch...
2025-11-14 17:51:26,061 - INFO - Processing document 4_2024-09-04
2025-11-14 17:51:26,086 - INFO - Finished converting document 4_2024-09-04 in 0.05 sec.
2025-11-14 17:51:26,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,150 - INFO - Going to convert document batch...
2025-11-14 17:51:26,151 - INFO - Processing document 4_2024-10-02
2025-11-14 17:51:26,177 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 17:51:26,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,218 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\4_2024-08-30' --> 'data\processed_data\V\4_2024-08-30.md'
Converted 'data\edgar_documents\V\4_2024-09-04' --> 'data\processed_data\V\4_2024-09-04.md'
Converted 'data\edgar_documents\V\4_2024-10-02' --> 'data\processed_data\V\4_2024-10-02.md'


2025-11-14 17:51:26,219 - INFO - Processing document 4_2024-11-01
2025-11-14 17:51:26,240 - INFO - Finished converting document 4_2024-11-01 in 0.03 sec.
2025-11-14 17:51:26,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,294 - INFO - Going to convert document batch...
2025-11-14 17:51:26,296 - INFO - Processing document 4_2024-11-21
2025-11-14 17:51:26,329 - INFO - Finished converting document 4_2024-11-21 in 0.06 sec.
2025-11-14 17:51:26,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,388 - INFO - Going to convert document batch...
2025-11-14 17:51:26,389 - INFO - Processing document 4_2024-11-22
2025-11-14 17:51:26,409 - INFO - Finished converting document 4_2024-11-22 in 0.05 sec.
2025-11-14 17:51:26,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,449 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\4_2024-11-01' --> 'data\processed_data\V\4_2024-11-01.md'
Converted 'data\edgar_documents\V\4_2024-11-21' --> 'data\processed_data\V\4_2024-11-21.md'
Converted 'data\edgar_documents\V\4_2024-11-22' --> 'data\processed_data\V\4_2024-11-22.md'


2025-11-14 17:51:26,450 - INFO - Processing document 4_2024-11-25
2025-11-14 17:51:26,467 - INFO - Finished converting document 4_2024-11-25 in 0.05 sec.
2025-11-14 17:51:26,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,525 - INFO - Going to convert document batch...
2025-11-14 17:51:26,527 - INFO - Processing document 4_2024-12-03
2025-11-14 17:51:26,560 - INFO - Finished converting document 4_2024-12-03 in 0.08 sec.
2025-11-14 17:51:26,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,606 - INFO - Going to convert document batch...
2025-11-14 17:51:26,606 - INFO - Processing document 4_2024-12-13
2025-11-14 17:51:26,623 - INFO - Finished converting document 4_2024-12-13 in 0.05 sec.
2025-11-14 17:51:26,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,663 - INFO - Going to convert document batch...
2025-11-14 17:51:26,664 - INFO - Processing document 4_2025-01-03
2025-11-14 17:51:26,685 - IN

Converted 'data\edgar_documents\V\4_2024-11-25' --> 'data\processed_data\V\4_2024-11-25.md'
Converted 'data\edgar_documents\V\4_2024-12-03' --> 'data\processed_data\V\4_2024-12-03.md'
Converted 'data\edgar_documents\V\4_2024-12-13' --> 'data\processed_data\V\4_2024-12-13.md'


2025-11-14 17:51:26,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,739 - INFO - Going to convert document batch...
2025-11-14 17:51:26,740 - INFO - Processing document 4_2025-01-29
2025-11-14 17:51:26,758 - INFO - Finished converting document 4_2025-01-29 in 0.05 sec.
2025-11-14 17:51:26,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,812 - INFO - Going to convert document batch...
2025-11-14 17:51:26,814 - INFO - Processing document 4_2025-02-04
2025-11-14 17:51:26,836 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 17:51:26,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\4_2025-01-03' --> 'data\processed_data\V\4_2025-01-03.md'
Converted 'data\edgar_documents\V\4_2025-01-29' --> 'data\processed_data\V\4_2025-01-29.md'
Converted 'data\edgar_documents\V\4_2025-02-04' --> 'data\processed_data\V\4_2025-02-04.md'


2025-11-14 17:51:26,896 - INFO - Going to convert document batch...
2025-11-14 17:51:26,897 - INFO - Processing document 4_2025-02-07
2025-11-14 17:51:26,914 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 17:51:26,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:26,956 - INFO - Going to convert document batch...
2025-11-14 17:51:26,957 - INFO - Processing document 4_2025-02-18
2025-11-14 17:51:26,978 - INFO - Finished converting document 4_2025-02-18 in 0.03 sec.
2025-11-14 17:51:27,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,020 - INFO - Going to convert document batch...
2025-11-14 17:51:27,021 - INFO - Processing document 4_2025-03-04
2025-11-14 17:51:27,067 - INFO - Finished converting document 4_2025-03-04 in 0.06 sec.
2025-11-14 17:51:27,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,116 - INFO - Going to convert document batch...
2025-11-14 17:51:27,116 - 

Converted 'data\edgar_documents\V\4_2025-02-07' --> 'data\processed_data\V\4_2025-02-07.md'
Converted 'data\edgar_documents\V\4_2025-02-18' --> 'data\processed_data\V\4_2025-02-18.md'
Converted 'data\edgar_documents\V\4_2025-03-04' --> 'data\processed_data\V\4_2025-03-04.md'


2025-11-14 17:51:27,140 - INFO - Finished converting document 4_2025-03-14 in 0.05 sec.
2025-11-14 17:51:27,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,189 - INFO - Going to convert document batch...
2025-11-14 17:51:27,190 - INFO - Processing document 4_2025-03-20
2025-11-14 17:51:27,212 - INFO - Finished converting document 4_2025-03-20 in 0.03 sec.
2025-11-14 17:51:27,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,256 - INFO - Going to convert document batch...
2025-11-14 17:51:27,257 - INFO - Processing document 4_2025-04-03
2025-11-14 17:51:27,282 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:51:27,327 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:51:27,327 - ERROR - Input document 4_2025-04-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\V\4_2025-03-14' --> 'data\processed_data\V\4_2025-03-14.md'
Converted 'data\edgar_documents\V\4_2025-03-20' --> 'data\processed_data\V\4_2025-03-20.md'
Converted 'data\edgar_documents\V\4_2025-04-03' --> 'data\processed_data\V\4_2025-04-03.md'
Error processing data\edgar_documents\V\4_2025-04-30: File format not allowed: data\edgar_documents\V\4_2025-04-30


2025-11-14 17:51:27,355 - ERROR - Input document 4_2025-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:51:27,356 - INFO - Going to convert document batch...
2025-11-14 17:51:27,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,377 - INFO - Going to convert document batch...
2025-11-14 17:51:27,378 - INFO - Processing document 4_2025-05-02
2025-11-14 17:51:27,401 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 17:51:27,467 - INFO - detec

Error processing data\edgar_documents\V\4_2025-05-01: File format not allowed: data\edgar_documents\V\4_2025-05-01
Converted 'data\edgar_documents\V\4_2025-05-02' --> 'data\processed_data\V\4_2025-05-02.md'
Converted 'data\edgar_documents\V\4_2025-05-09' --> 'data\processed_data\V\4_2025-05-09.md'


2025-11-14 17:51:27,553 - INFO - Going to convert document batch...
2025-11-14 17:51:27,553 - INFO - Processing document 4_2025-05-12
2025-11-14 17:51:27,574 - INFO - Finished converting document 4_2025-05-12 in 0.05 sec.
2025-11-14 17:51:27,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,622 - INFO - Going to convert document batch...
2025-11-14 17:51:27,623 - INFO - Processing document 4_2025-06-04
2025-11-14 17:51:27,644 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 17:51:27,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,689 - INFO - Going to convert document batch...
2025-11-14 17:51:27,690 - INFO - Processing document 4_2025-06-05
2025-11-14 17:51:27,717 - INFO - Finished converting document 4_2025-06-05 in 0.05 sec.
2025-11-14 17:51:27,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,766 - INFO - Going to convert document batch...
2025-11-14 17:51:27,767 - 

Converted 'data\edgar_documents\V\4_2025-05-12' --> 'data\processed_data\V\4_2025-05-12.md'
Converted 'data\edgar_documents\V\4_2025-06-04' --> 'data\processed_data\V\4_2025-06-04.md'
Converted 'data\edgar_documents\V\4_2025-06-05' --> 'data\processed_data\V\4_2025-06-05.md'


2025-11-14 17:51:27,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,838 - INFO - Going to convert document batch...
2025-11-14 17:51:27,839 - INFO - Processing document 4_2025-06-12
2025-11-14 17:51:27,861 - INFO - Finished converting document 4_2025-06-12 in 0.05 sec.
2025-11-14 17:51:27,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,908 - INFO - Going to convert document batch...
2025-11-14 17:51:27,909 - INFO - Processing document 4_2025-07-02
2025-11-14 17:51:27,932 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 17:51:27,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:27,991 - INFO - Going to convert document batch...
2025-11-14 17:51:27,992 - INFO - Processing document 4_2025-08-15
2025-11-14 17:51:28,014 - INFO - Finished converting document 4_2025-08-15 in 0.06 sec.


Converted 'data\edgar_documents\V\4_2025-06-06' --> 'data\processed_data\V\4_2025-06-06.md'
Converted 'data\edgar_documents\V\4_2025-06-12' --> 'data\processed_data\V\4_2025-06-12.md'
Converted 'data\edgar_documents\V\4_2025-07-02' --> 'data\processed_data\V\4_2025-07-02.md'


2025-11-14 17:51:28,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,057 - INFO - Going to convert document batch...
2025-11-14 17:51:28,058 - INFO - Processing document 4_2025-08-19
2025-11-14 17:51:28,081 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 17:51:28,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,129 - INFO - Going to convert document batch...
2025-11-14 17:51:28,130 - INFO - Processing document 4_2025-09-03
2025-11-14 17:51:28,154 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:51:28,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,198 - INFO - Going to convert document batch...
2025-11-14 17:51:28,198 - INFO - Processing document 4_2025-10-02
2025-11-14 17:51:28,220 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.


Converted 'data\edgar_documents\V\4_2025-08-15' --> 'data\processed_data\V\4_2025-08-15.md'
Converted 'data\edgar_documents\V\4_2025-08-19' --> 'data\processed_data\V\4_2025-08-19.md'
Converted 'data\edgar_documents\V\4_2025-09-03' --> 'data\processed_data\V\4_2025-09-03.md'


2025-11-14 17:51:28,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,261 - INFO - Going to convert document batch...
2025-11-14 17:51:28,262 - INFO - Processing document 4_2025-10-16
2025-11-14 17:51:28,279 - INFO - Finished converting document 4_2025-10-16 in 0.03 sec.
2025-11-14 17:51:28,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,322 - INFO - Going to convert document batch...
2025-11-14 17:51:28,323 - INFO - Processing document 4_2025-11-04
2025-11-14 17:51:28,348 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 17:51:28,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,394 - INFO - Going to convert document batch...
2025-11-14 17:51:28,395 - INFO - Processing document 4_2025-11-05
2025-11-14 17:51:28,415 - INFO - Finished converting document 4_2025-11-05 in 0.03 sec.


Converted 'data\edgar_documents\V\4_2025-10-02' --> 'data\processed_data\V\4_2025-10-02.md'
Converted 'data\edgar_documents\V\4_2025-10-16' --> 'data\processed_data\V\4_2025-10-16.md'
Converted 'data\edgar_documents\V\4_2025-11-04' --> 'data\processed_data\V\4_2025-11-04.md'
Converted 'data\edgar_documents\V\4_2025-11-05' --> 'data\processed_data\V\4_2025-11-05.md'


2025-11-14 17:51:28,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,493 - INFO - Going to convert document batch...
2025-11-14 17:51:28,494 - INFO - Processing document 8-K_2023-01-05
2025-11-14 17:51:28,520 - INFO - Finished converting document 8-K_2023-01-05 in 0.08 sec.
2025-11-14 17:51:28,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,579 - INFO - Going to convert document batch...
2025-11-14 17:51:28,579 - INFO - Processing document 8-K_2023-01-25
2025-11-14 17:51:28,622 - INFO - Finished converting document 8-K_2023-01-25 in 0.09 sec.
2025-11-14 17:51:28,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,672 - INFO - Going to convert document batch...
2025-11-14 17:51:28,673 - INFO - Processing document 8-K_2023-01-26
2025-11-14 17:51:28,697 - INFO - Finished converting document 8-K_2023-01-26 in 0.06 sec.
2025-11-14 17:51:28,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\8-K_2023-01-05' --> 'data\processed_data\V\8-K_2023-01-05.md'
Converted 'data\edgar_documents\V\8-K_2023-01-25' --> 'data\processed_data\V\8-K_2023-01-25.md'
Converted 'data\edgar_documents\V\8-K_2023-01-26' --> 'data\processed_data\V\8-K_2023-01-26.md'


2025-11-14 17:51:28,738 - INFO - Going to convert document batch...
2025-11-14 17:51:28,739 - INFO - Processing document 8-K_2023-02-01
2025-11-14 17:51:28,761 - INFO - Finished converting document 8-K_2023-02-01 in 0.06 sec.
2025-11-14 17:51:28,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,816 - INFO - Going to convert document batch...
2025-11-14 17:51:28,818 - INFO - Processing document 8-K_2023-02-16
2025-11-14 17:51:28,849 - INFO - Finished converting document 8-K_2023-02-16 in 0.08 sec.
2025-11-14 17:51:28,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:28,923 - INFO - Going to convert document batch...
2025-11-14 17:51:28,923 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:51:28,969 - INFO - Finished converting document 8-K_2023-03-03 in 0.11 sec.


Converted 'data\edgar_documents\V\8-K_2023-02-01' --> 'data\processed_data\V\8-K_2023-02-01.md'
Converted 'data\edgar_documents\V\8-K_2023-02-16' --> 'data\processed_data\V\8-K_2023-02-16.md'


2025-11-14 17:51:29,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,020 - INFO - Going to convert document batch...
2025-11-14 17:51:29,021 - INFO - Processing document 8-K_2023-04-10
2025-11-14 17:51:29,046 - INFO - Finished converting document 8-K_2023-04-10 in 0.06 sec.
2025-11-14 17:51:29,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,089 - INFO - Going to convert document batch...
2025-11-14 17:51:29,090 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:51:29,118 - INFO - Finished converting document 8-K_2023-04-25 in 0.05 sec.
2025-11-14 17:51:29,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,189 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\8-K_2023-03-03' --> 'data\processed_data\V\8-K_2023-03-03.md'
Converted 'data\edgar_documents\V\8-K_2023-04-10' --> 'data\processed_data\V\8-K_2023-04-10.md'
Converted 'data\edgar_documents\V\8-K_2023-04-25' --> 'data\processed_data\V\8-K_2023-04-25.md'


2025-11-14 17:51:29,190 - INFO - Processing document 8-K_2023-05-30
2025-11-14 17:51:29,243 - INFO - Finished converting document 8-K_2023-05-30 in 0.09 sec.
2025-11-14 17:51:29,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,302 - INFO - Going to convert document batch...
2025-11-14 17:51:29,303 - INFO - Processing document 8-K_2023-06-20
2025-11-14 17:51:29,329 - INFO - Finished converting document 8-K_2023-06-20 in 0.06 sec.
2025-11-14 17:51:29,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,367 - INFO - Going to convert document batch...
2025-11-14 17:51:29,368 - INFO - Processing document 8-K_2023-06-23


Converted 'data\edgar_documents\V\8-K_2023-05-30' --> 'data\processed_data\V\8-K_2023-05-30.md'
Converted 'data\edgar_documents\V\8-K_2023-06-20' --> 'data\processed_data\V\8-K_2023-06-20.md'


2025-11-14 17:51:29,631 - INFO - Finished converting document 8-K_2023-06-23 in 0.28 sec.
2025-11-14 17:51:29,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,665 - INFO - Going to convert document batch...
2025-11-14 17:51:29,666 - INFO - Processing document 8-K_2023-06-29
2025-11-14 17:51:29,686 - INFO - Finished converting document 8-K_2023-06-29 in 0.05 sec.
2025-11-14 17:51:29,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,731 - INFO - Going to convert document batch...
2025-11-14 17:51:29,732 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:51:29,757 - INFO - Finished converting document 8-K_2023-07-25 in 0.05 sec.
2025-11-14 17:51:29,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,809 - INFO - Going to convert document batch...
2025-11-14 17:51:29,810 - INFO - Processing document 8-K_2023-08-30


Converted 'data\edgar_documents\V\8-K_2023-06-23' --> 'data\processed_data\V\8-K_2023-06-23.md'
Converted 'data\edgar_documents\V\8-K_2023-06-29' --> 'data\processed_data\V\8-K_2023-06-29.md'
Converted 'data\edgar_documents\V\8-K_2023-07-25' --> 'data\processed_data\V\8-K_2023-07-25.md'


2025-11-14 17:51:29,857 - INFO - Finished converting document 8-K_2023-08-30 in 0.09 sec.
2025-11-14 17:51:29,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:29,912 - INFO - Going to convert document batch...
2025-11-14 17:51:29,913 - INFO - Processing document 8-K_2023-09-13
2025-11-14 17:51:29,950 - INFO - Finished converting document 8-K_2023-09-13 in 0.08 sec.
2025-11-14 17:51:30,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,021 - INFO - Going to convert document batch...
2025-11-14 17:51:30,021 - INFO - Processing document 8-K_2023-10-02
2025-11-14 17:51:30,043 - INFO - Finished converting document 8-K_2023-10-02 in 0.08 sec.
2025-11-14 17:51:30,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\8-K_2023-08-30' --> 'data\processed_data\V\8-K_2023-08-30.md'
Converted 'data\edgar_documents\V\8-K_2023-09-13' --> 'data\processed_data\V\8-K_2023-09-13.md'
Converted 'data\edgar_documents\V\8-K_2023-10-02' --> 'data\processed_data\V\8-K_2023-10-02.md'


2025-11-14 17:51:30,079 - INFO - Going to convert document batch...
2025-11-14 17:51:30,080 - INFO - Processing document 8-K_2023-10-18
2025-11-14 17:51:30,104 - INFO - Finished converting document 8-K_2023-10-18 in 0.06 sec.
2025-11-14 17:51:30,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,146 - INFO - Going to convert document batch...
2025-11-14 17:51:30,147 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:51:30,173 - INFO - Finished converting document 8-K_2023-10-24 in 0.06 sec.
2025-11-14 17:51:30,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,249 - INFO - Going to convert document batch...
2025-11-14 17:51:30,250 - INFO - Processing document 8-K_2024-01-24


Converted 'data\edgar_documents\V\8-K_2023-10-18' --> 'data\processed_data\V\8-K_2023-10-18.md'
Converted 'data\edgar_documents\V\8-K_2023-10-24' --> 'data\processed_data\V\8-K_2023-10-24.md'


2025-11-14 17:51:30,320 - INFO - Finished converting document 8-K_2024-01-24 in 0.12 sec.
2025-11-14 17:51:30,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,385 - INFO - Going to convert document batch...
2025-11-14 17:51:30,386 - INFO - Processing document 8-K_2024-01-25
2025-11-14 17:51:30,430 - INFO - Finished converting document 8-K_2024-01-25 in 0.08 sec.
2025-11-14 17:51:30,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,475 - INFO - Going to convert document batch...
2025-11-14 17:51:30,476 - INFO - Processing document 8-K_2024-03-26
2025-11-14 17:51:30,505 - INFO - Finished converting document 8-K_2024-03-26 in 0.06 sec.
2025-11-14 17:51:30,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\8-K_2024-01-24' --> 'data\processed_data\V\8-K_2024-01-24.md'
Converted 'data\edgar_documents\V\8-K_2024-01-25' --> 'data\processed_data\V\8-K_2024-01-25.md'
Converted 'data\edgar_documents\V\8-K_2024-03-26' --> 'data\processed_data\V\8-K_2024-03-26.md'


2025-11-14 17:51:30,547 - INFO - Going to convert document batch...
2025-11-14 17:51:30,547 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:51:30,573 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 17:51:30,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,611 - INFO - Going to convert document batch...
2025-11-14 17:51:30,612 - INFO - Processing document 8-K_2024-05-06
2025-11-14 17:51:30,631 - INFO - Finished converting document 8-K_2024-05-06 in 0.05 sec.
2025-11-14 17:51:30,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,667 - INFO - Going to convert document batch...
2025-11-14 17:51:30,668 - INFO - Processing document 8-K_2024-05-08
2025-11-14 17:51:30,688 - INFO - Finished converting document 8-K_2024-05-08 in 0.05 sec.
2025-11-14 17:51:30,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,721 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\V\8-K_2024-04-23' --> 'data\processed_data\V\8-K_2024-04-23.md'
Converted 'data\edgar_documents\V\8-K_2024-05-06' --> 'data\processed_data\V\8-K_2024-05-06.md'
Converted 'data\edgar_documents\V\8-K_2024-05-08' --> 'data\processed_data\V\8-K_2024-05-08.md'
Converted 'data\edgar_documents\V\8-K_2024-07-10' --> 'data\processed_data\V\8-K_2024-07-10.md'


2025-11-14 17:51:30,777 - INFO - Going to convert document batch...
2025-11-14 17:51:30,777 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:51:30,802 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 17:51:30,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,871 - INFO - Going to convert document batch...
2025-11-14 17:51:30,872 - INFO - Processing document 8-K_2024-09-26
2025-11-14 17:51:30,899 - INFO - Finished converting document 8-K_2024-09-26 in 0.08 sec.
2025-11-14 17:51:30,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,932 - INFO - Going to convert document batch...
2025-11-14 17:51:30,933 - INFO - Processing document 8-K_2024-10-11
2025-11-14 17:51:30,953 - INFO - Finished converting document 8-K_2024-10-11 in 0.05 sec.
2025-11-14 17:51:30,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:30,988 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\V\8-K_2024-07-23' --> 'data\processed_data\V\8-K_2024-07-23.md'
Converted 'data\edgar_documents\V\8-K_2024-09-26' --> 'data\processed_data\V\8-K_2024-09-26.md'
Converted 'data\edgar_documents\V\8-K_2024-10-11' --> 'data\processed_data\V\8-K_2024-10-11.md'


2025-11-14 17:51:31,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,073 - INFO - Going to convert document batch...
2025-11-14 17:51:31,074 - INFO - Processing document 8-K_2025-01-29
2025-11-14 17:51:31,133 - INFO - Finished converting document 8-K_2025-01-29 in 0.09 sec.
2025-11-14 17:51:31,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,202 - INFO - Going to convert document batch...
2025-11-14 17:51:31,202 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:51:31,229 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.


Converted 'data\edgar_documents\V\8-K_2024-10-29' --> 'data\processed_data\V\8-K_2024-10-29.md'
Converted 'data\edgar_documents\V\8-K_2025-01-29' --> 'data\processed_data\V\8-K_2025-01-29.md'


2025-11-14 17:51:31,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,263 - INFO - Going to convert document batch...
2025-11-14 17:51:31,264 - INFO - Processing document 8-K_2025-03-31
2025-11-14 17:51:31,286 - INFO - Finished converting document 8-K_2025-03-31 in 0.05 sec.
2025-11-14 17:51:31,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,323 - INFO - Going to convert document batch...
2025-11-14 17:51:31,324 - INFO - Processing document 8-K_2025-04-29
2025-11-14 17:51:31,350 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 17:51:31,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,388 - INFO - Going to convert document batch...
2025-11-14 17:51:31,389 - INFO - Processing document 8-K_2025-05-15
2025-11-14 17:51:31,414 - INFO - Finished converting document 8-K_2025-05-15 in 0.05 sec.


Converted 'data\edgar_documents\V\8-K_2025-01-30' --> 'data\processed_data\V\8-K_2025-01-30.md'
Converted 'data\edgar_documents\V\8-K_2025-03-31' --> 'data\processed_data\V\8-K_2025-03-31.md'
Converted 'data\edgar_documents\V\8-K_2025-04-29' --> 'data\processed_data\V\8-K_2025-04-29.md'


2025-11-14 17:51:31,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,474 - INFO - Going to convert document batch...
2025-11-14 17:51:31,475 - INFO - Processing document 8-K_2025-07-23
2025-11-14 17:51:31,502 - INFO - Finished converting document 8-K_2025-07-23 in 0.06 sec.
2025-11-14 17:51:31,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,547 - INFO - Going to convert document batch...
2025-11-14 17:51:31,548 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:51:31,581 - INFO - Finished converting document 8-K_2025-07-29 in 0.06 sec.
2025-11-14 17:51:31,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,625 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\8-K_2025-05-15' --> 'data\processed_data\V\8-K_2025-05-15.md'
Converted 'data\edgar_documents\V\8-K_2025-07-23' --> 'data\processed_data\V\8-K_2025-07-23.md'
Converted 'data\edgar_documents\V\8-K_2025-07-29' --> 'data\processed_data\V\8-K_2025-07-29.md'


2025-11-14 17:51:31,626 - INFO - Processing document 8-K_2025-08-08
2025-11-14 17:51:31,650 - INFO - Finished converting document 8-K_2025-08-08 in 0.05 sec.
2025-11-14 17:51:31,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,709 - INFO - Going to convert document batch...
2025-11-14 17:51:31,711 - INFO - Processing document 8-K_2025-09-19
2025-11-14 17:51:31,743 - INFO - Finished converting document 8-K_2025-09-19 in 0.08 sec.
2025-11-14 17:51:31,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,783 - INFO - Going to convert document batch...
2025-11-14 17:51:31,784 - INFO - Processing document 8-K_2025-09-26
2025-11-14 17:51:31,812 - INFO - Finished converting document 8-K_2025-09-26 in 0.06 sec.
2025-11-14 17:51:31,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,849 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\V\8-K_2025-08-08' --> 'data\processed_data\V\8-K_2025-08-08.md'
Converted 'data\edgar_documents\V\8-K_2025-09-19' --> 'data\processed_data\V\8-K_2025-09-19.md'
Converted 'data\edgar_documents\V\8-K_2025-09-26' --> 'data\processed_data\V\8-K_2025-09-26.md'


2025-11-14 17:51:31,850 - INFO - Processing document 8-K_2025-09-29
2025-11-14 17:51:31,877 - INFO - Finished converting document 8-K_2025-09-29 in 0.05 sec.
2025-11-14 17:51:31,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,921 - INFO - Going to convert document batch...
2025-11-14 17:51:31,922 - INFO - Processing document 8-K_2025-10-28
2025-11-14 17:51:31,950 - INFO - Finished converting document 8-K_2025-10-28 in 0.06 sec.
2025-11-14 17:51:31,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:31,989 - INFO - Going to convert document batch...
2025-11-14 17:51:31,990 - INFO - Processing document 8-K_2025-11-10
2025-11-14 17:51:32,018 - INFO - Finished converting document 8-K_2025-11-10 in 0.06 sec.


Converted 'data\edgar_documents\V\8-K_2025-09-29' --> 'data\processed_data\V\8-K_2025-09-29.md'
Converted 'data\edgar_documents\V\8-K_2025-10-28' --> 'data\processed_data\V\8-K_2025-10-28.md'
Converted 'data\edgar_documents\V\8-K_2025-11-10' --> 'data\processed_data\V\8-K_2025-11-10.md'


2025-11-14 17:51:32,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:51:33,820 - INFO - Going to convert document batch...
2025-11-14 17:51:33,821 - INFO - Processing document DEF-14A_2023-12-07
2025-11-14 17:51:35,923 - INFO - Finished converting document DEF-14A_2023-12-07 in 3.89 sec.
2025-11-14 17:51:37,511 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\DEF-14A_2023-12-07' --> 'data\processed_data\V\DEF-14A_2023-12-07.md'


2025-11-14 17:51:38,141 - INFO - Going to convert document batch...
2025-11-14 17:51:38,142 - INFO - Processing document DEF-14A_2024-12-09
2025-11-14 17:51:50,001 - INFO - Finished converting document DEF-14A_2024-12-09 in 12.56 sec.
2025-11-14 17:51:51,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\V\DEF-14A_2024-12-09' --> 'data\processed_data\V\DEF-14A_2024-12-09.md'
Processed 127 new files. Errors: 6
Found 213 files to process in data\edgar_documents\VZ


2025-11-14 17:51:52,351 - INFO - Going to convert document batch...
2025-11-14 17:51:52,351 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:51:52,351 - INFO - Processing document 10-K_2023-02-10
2025-11-14 17:51:55,414 - INFO - Finished converting document 10-K_2023-02-10 in 4.17 sec.
2025-11-14 17:51:56,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-K_2023-02-10' --> 'data\processed_data\VZ\10-K_2023-02-10.md'


2025-11-14 17:51:57,836 - INFO - Going to convert document batch...
2025-11-14 17:51:57,838 - INFO - Processing document 10-K_2024-02-09
2025-11-14 17:52:01,067 - INFO - Finished converting document 10-K_2024-02-09 in 4.80 sec.


Converted 'data\edgar_documents\VZ\10-K_2024-02-09' --> 'data\processed_data\VZ\10-K_2024-02-09.md'


2025-11-14 17:52:02,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:03,242 - INFO - Going to convert document batch...
2025-11-14 17:52:03,243 - INFO - Processing document 10-K_2025-02-12
2025-11-14 17:52:06,816 - INFO - Finished converting document 10-K_2025-02-12 in 4.86 sec.
2025-11-14 17:52:07,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-K_2025-02-12' --> 'data\processed_data\VZ\10-K_2025-02-12.md'


2025-11-14 17:52:08,268 - INFO - Going to convert document batch...
2025-11-14 17:52:08,270 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 17:52:09,170 - INFO - Finished converting document 10-Q_2023-04-27 in 1.42 sec.
2025-11-14 17:52:09,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2023-04-27' --> 'data\processed_data\VZ\10-Q_2023-04-27.md'


2025-11-14 17:52:10,771 - INFO - Going to convert document batch...
2025-11-14 17:52:10,773 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 17:52:11,873 - INFO - Finished converting document 10-Q_2023-07-28 in 2.25 sec.
2025-11-14 17:52:12,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2023-07-28' --> 'data\processed_data\VZ\10-Q_2023-07-28.md'


2025-11-14 17:52:13,412 - INFO - Going to convert document batch...
2025-11-14 17:52:13,416 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 17:52:14,578 - INFO - Finished converting document 10-Q_2023-10-26 in 2.16 sec.
2025-11-14 17:52:15,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2023-10-26' --> 'data\processed_data\VZ\10-Q_2023-10-26.md'


2025-11-14 17:52:15,755 - INFO - Going to convert document batch...
2025-11-14 17:52:15,756 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 17:52:17,144 - INFO - Finished converting document 10-Q_2024-04-25 in 1.97 sec.
2025-11-14 17:52:17,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2024-04-25' --> 'data\processed_data\VZ\10-Q_2024-04-25.md'


2025-11-14 17:52:18,247 - INFO - Going to convert document batch...
2025-11-14 17:52:18,248 - INFO - Processing document 10-Q_2024-07-25
2025-11-14 17:52:19,357 - INFO - Finished converting document 10-Q_2024-07-25 in 1.75 sec.
2025-11-14 17:52:20,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2024-07-25' --> 'data\processed_data\VZ\10-Q_2024-07-25.md'


2025-11-14 17:52:21,105 - INFO - Going to convert document batch...
2025-11-14 17:52:21,106 - INFO - Processing document 10-Q_2024-10-25
2025-11-14 17:52:22,304 - INFO - Finished converting document 10-Q_2024-10-25 in 1.88 sec.
2025-11-14 17:52:22,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2024-10-25' --> 'data\processed_data\VZ\10-Q_2024-10-25.md'


2025-11-14 17:52:23,762 - INFO - Going to convert document batch...
2025-11-14 17:52:23,763 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 17:52:24,790 - INFO - Finished converting document 10-Q_2025-04-25 in 1.91 sec.
2025-11-14 17:52:25,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2025-04-25' --> 'data\processed_data\VZ\10-Q_2025-04-25.md'


2025-11-14 17:52:26,257 - INFO - Going to convert document batch...
2025-11-14 17:52:26,258 - INFO - Processing document 10-Q_2025-07-25
2025-11-14 17:52:27,533 - INFO - Finished converting document 10-Q_2025-07-25 in 2.25 sec.
2025-11-14 17:52:28,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\10-Q_2025-07-25' --> 'data\processed_data\VZ\10-Q_2025-07-25.md'


2025-11-14 17:52:29,048 - INFO - Going to convert document batch...
2025-11-14 17:52:29,049 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 17:52:30,373 - INFO - Finished converting document 10-Q_2025-10-29 in 2.27 sec.
2025-11-14 17:52:30,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:30,970 - INFO - Going to convert document batch...
2025-11-14 17:52:30,971 - INFO - Processing document 4_2023-01-06
2025-11-14 17:52:30,991 - INFO - Finished converting document 4_2023-01-06 in 0.03 sec.
2025-11-14 17:52:31,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,035 - INFO - Going to convert document batch...
2025-11-14 17:52:31,035 - INFO - Processing document 4_2023-01-09
2025-11-14 17:52:31,052 - INFO - Finished converting document 4_2023-01-09 in 0.03 sec.
2025-11-14 17:52:31,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,114 - INFO - Going to convert document batch...
2025-11-14 17:52:31,

Converted 'data\edgar_documents\VZ\10-Q_2025-10-29' --> 'data\processed_data\VZ\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\VZ\4_2023-01-06' --> 'data\processed_data\VZ\4_2023-01-06.md'
Converted 'data\edgar_documents\VZ\4_2023-01-09' --> 'data\processed_data\VZ\4_2023-01-09.md'
Converted 'data\edgar_documents\VZ\4_2023-01-23' --> 'data\processed_data\VZ\4_2023-01-23.md'


2025-11-14 17:52:31,170 - INFO - Going to convert document batch...
2025-11-14 17:52:31,171 - INFO - Processing document 4_2023-02-06
2025-11-14 17:52:31,190 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 17:52:31,235 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:31,236 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:31,237 - INFO - Going to convert document batch...
2025-11-14 17:52:31,248 - IN

Converted 'data\edgar_documents\VZ\4_2023-02-06' --> 'data\processed_data\VZ\4_2023-02-06.md'
Error processing data\edgar_documents\VZ\4_2023-02-13: File format not allowed: data\edgar_documents\VZ\4_2023-02-13
Converted 'data\edgar_documents\VZ\4_2023-02-14' --> 'data\processed_data\VZ\4_2023-02-14.md'
Converted 'data\edgar_documents\VZ\4_2023-02-17' --> 'data\processed_data\VZ\4_2023-02-17.md'


2025-11-14 17:52:31,385 - INFO - Going to convert document batch...
2025-11-14 17:52:31,398 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:31,399 - ERROR - Input document 4_2023-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:31,400 - INFO - Going to convert document batch...
2025-11-14 17:52:31,413 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,425 - INFO - Going to convert document batch...
2025-11-14 17:52:31,426 - INFO - P

Error processing data\edgar_documents\VZ\4_2023-02-21: File format not allowed: data\edgar_documents\VZ\4_2023-02-21
Error processing data\edgar_documents\VZ\4_2023-02-27: File format not allowed: data\edgar_documents\VZ\4_2023-02-27
Converted 'data\edgar_documents\VZ\4_2023-03-03' --> 'data\processed_data\VZ\4_2023-03-03.md'


2025-11-14 17:52:31,589 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:31,590 - ERROR - Input document 4_2023-03-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:31,592 - INFO - Going to convert document batch...
2025-11-14 17:52:31,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,615 - INFO - Going to convert document batch...
2025-11-14 17:52:31,616 - INFO - Processing document 4_2023-03-15
2025-11-14 17:52:31,634 - INFO - Fin

Converted 'data\edgar_documents\VZ\4_2023-03-06' --> 'data\processed_data\VZ\4_2023-03-06.md'
Error processing data\edgar_documents\VZ\4_2023-03-13: File format not allowed: data\edgar_documents\VZ\4_2023-03-13
Converted 'data\edgar_documents\VZ\4_2023-03-15' --> 'data\processed_data\VZ\4_2023-03-15.md'
Converted 'data\edgar_documents\VZ\4_2023-03-17' --> 'data\processed_data\VZ\4_2023-03-17.md'


2025-11-14 17:52:31,765 - INFO - Processing document 4_2023-03-20
2025-11-14 17:52:31,784 - INFO - Finished converting document 4_2023-03-20 in 0.05 sec.
2025-11-14 17:52:31,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,832 - INFO - Going to convert document batch...
2025-11-14 17:52:31,833 - INFO - Processing document 4_2023-03-29
2025-11-14 17:52:31,854 - INFO - Finished converting document 4_2023-03-29 in 0.05 sec.
2025-11-14 17:52:31,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,901 - INFO - Going to convert document batch...
2025-11-14 17:52:31,902 - INFO - Processing document 4_2023-04-03
2025-11-14 17:52:31,924 - INFO - Finished converting document 4_2023-04-03 in 0.05 sec.
2025-11-14 17:52:31,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:31,967 - INFO - Going to convert document batch...
2025-11-14 17:52:31,968 - INFO - Processing document 4_2023-04-12
2025-11-14 17:52:31,989 - IN

Converted 'data\edgar_documents\VZ\4_2023-03-20' --> 'data\processed_data\VZ\4_2023-03-20.md'
Converted 'data\edgar_documents\VZ\4_2023-03-29' --> 'data\processed_data\VZ\4_2023-03-29.md'
Converted 'data\edgar_documents\VZ\4_2023-04-03' --> 'data\processed_data\VZ\4_2023-04-03.md'


2025-11-14 17:52:32,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:32,035 - INFO - Going to convert document batch...
2025-11-14 17:52:32,036 - INFO - Processing document 4_2023-04-17
2025-11-14 17:52:32,058 - INFO - Finished converting document 4_2023-04-17 in 0.05 sec.
2025-11-14 17:52:32,098 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,099 - ERROR - Input document 4_2023-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52

Converted 'data\edgar_documents\VZ\4_2023-04-12' --> 'data\processed_data\VZ\4_2023-04-12.md'
Converted 'data\edgar_documents\VZ\4_2023-04-17' --> 'data\processed_data\VZ\4_2023-04-17.md'
Error processing data\edgar_documents\VZ\4_2023-05-01: File format not allowed: data\edgar_documents\VZ\4_2023-05-01
Converted 'data\edgar_documents\VZ\4_2023-05-03' --> 'data\processed_data\VZ\4_2023-05-03.md'
Error processing data\edgar_documents\VZ\4_2023-05-05: File format not allowed: data\edgar_documents\VZ\4_2023-05-05


2025-11-14 17:52:32,205 - ERROR - Input document 4_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:32,208 - INFO - Going to convert document batch...
2025-11-14 17:52:32,218 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,219 - ERROR - Input document 4_2023-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\VZ\4_2023-05-08: File format not allowed: data\edgar_documents\VZ\4_2023-05-08
Error processing data\edgar_documents\VZ\4_2023-05-15: File format not allowed: data\edgar_documents\VZ\4_2023-05-15
Error processing data\edgar_documents\VZ\4_2023-05-22: File format not allowed: data\edgar_documents\VZ\4_2023-05-22
Converted 'data\edgar_documents\VZ\4_2023-05-25' --> 'data\processed_data\VZ\4_2023-05-25.md'
Converted 'data\edgar_documents\VZ\4_2023-05-30' --> 'data\processed_data\VZ\4_2023-05-30.md'
Error processing data\edgar_documents\VZ\4_2023-06-05: File format not allowed: data\edgar_documents\VZ\4_2023-06-05


2025-11-14 17:52:32,396 - ERROR - Input document 4_2023-06-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:32,397 - INFO - Going to convert document batch...
2025-11-14 17:52:32,409 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,410 - ERROR - Input document 4_2023-06-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\VZ\4_2023-06-12: File format not allowed: data\edgar_documents\VZ\4_2023-06-12
Error processing data\edgar_documents\VZ\4_2023-06-20: File format not allowed: data\edgar_documents\VZ\4_2023-06-20
Error processing data\edgar_documents\VZ\4_2023-06-26: File format not allowed: data\edgar_documents\VZ\4_2023-06-26
Error processing data\edgar_documents\VZ\4_2023-07-03: File format not allowed: data\edgar_documents\VZ\4_2023-07-03
Converted 'data\edgar_documents\VZ\4_2023-07-10' --> 'data\processed_data\VZ\4_2023-07-10.md'
Converted 'data\edgar_documents\VZ\4_2023-07-24' --> 'data\processed_data\VZ\4_2023-07-24.md'


2025-11-14 17:52:32,578 - ERROR - Input document 4_2023-07-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:32,579 - INFO - Going to convert document batch...
2025-11-14 17:52:32,589 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,590 - ERROR - Input document 4_2023-08-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\VZ\4_2023-07-31: File format not allowed: data\edgar_documents\VZ\4_2023-07-31
Error processing data\edgar_documents\VZ\4_2023-08-07: File format not allowed: data\edgar_documents\VZ\4_2023-08-07
Error processing data\edgar_documents\VZ\4_2023-08-14: File format not allowed: data\edgar_documents\VZ\4_2023-08-14
Converted 'data\edgar_documents\VZ\4_2023-08-15' --> 'data\processed_data\VZ\4_2023-08-15.md'
Error processing data\edgar_documents\VZ\4_2023-08-21: File format not allowed: data\edgar_documents\VZ\4_2023-08-21
Error processing data\edgar_documents\VZ\4_2023-08-28: File format not allowed: data\edgar_documents\VZ\4_2023-08-28
Error processing data\edgar_documents\VZ\4_2023-09-05: File format not allowed: data\edgar_documents\VZ\4_2023-09-05
Converted 'data\edgar_documents\VZ\4_2023-09-06' --> 'data\processed_data\VZ\4_2023-09-06.md'


2025-11-14 17:52:32,797 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,798 - ERROR - Input document 4_2023-09-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:32,799 - INFO - Going to convert document batch...
2025-11-14 17:52:32,811 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:32,812 - ERROR - Input document 4_2023-09-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\VZ\4_2023-09-11: File format not allowed: data\edgar_documents\VZ\4_2023-09-11
Error processing data\edgar_documents\VZ\4_2023-09-18: File format not allowed: data\edgar_documents\VZ\4_2023-09-18
Error processing data\edgar_documents\VZ\4_2023-09-25: File format not allowed: data\edgar_documents\VZ\4_2023-09-25
Error processing data\edgar_documents\VZ\4_2023-10-02: File format not allowed: data\edgar_documents\VZ\4_2023-10-02


2025-11-14 17:52:33,287 - INFO - Finished converting document 4_2023-10-16 in 0.44 sec.
2025-11-14 17:52:33,318 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:33,319 - ERROR - Input document 4_2023-10-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:33,320 - INFO - Going to convert document batch...
2025-11-14 17:52:33,332 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:33,333 - ERROR - Input document 4_2023-11-06 with forma

Converted 'data\edgar_documents\VZ\4_2023-10-16' --> 'data\processed_data\VZ\4_2023-10-16.md'
Error processing data\edgar_documents\VZ\4_2023-10-30: File format not allowed: data\edgar_documents\VZ\4_2023-10-30
Error processing data\edgar_documents\VZ\4_2023-11-06: File format not allowed: data\edgar_documents\VZ\4_2023-11-06
Error processing data\edgar_documents\VZ\4_2023-11-13: File format not allowed: data\edgar_documents\VZ\4_2023-11-13
Error processing data\edgar_documents\VZ\4_2023-11-20: File format not allowed: data\edgar_documents\VZ\4_2023-11-20
Converted 'data\edgar_documents\VZ\4_2023-11-22' --> 'data\processed_data\VZ\4_2023-11-22.md'


2025-11-14 17:52:33,487 - ERROR - Input document 4_2023-11-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:33,488 - INFO - Going to convert document batch...
2025-11-14 17:52:33,501 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:33,502 - ERROR - Input document 4_2023-12-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\VZ\4_2023-11-27: File format not allowed: data\edgar_documents\VZ\4_2023-11-27
Error processing data\edgar_documents\VZ\4_2023-12-04: File format not allowed: data\edgar_documents\VZ\4_2023-12-04
Converted 'data\edgar_documents\VZ\4_2023-12-05' --> 'data\processed_data\VZ\4_2023-12-05.md'
Error processing data\edgar_documents\VZ\4_2023-12-11: File format not allowed: data\edgar_documents\VZ\4_2023-12-11
Converted 'data\edgar_documents\VZ\4_2023-12-13' --> 'data\processed_data\VZ\4_2023-12-13.md'


2025-11-14 17:52:33,695 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:33,696 - ERROR - Input document 4_2023-12-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:33,697 - INFO - Going to convert document batch...
2025-11-14 17:52:33,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:33,712 - INFO - Going to convert document batch...
2025-11-14 17:52:33,713 - INFO - Processing document 4_2023-12-26
2025-11-14 17:52:33,734 - INFO - Fin

Error processing data\edgar_documents\VZ\4_2023-12-18: File format not allowed: data\edgar_documents\VZ\4_2023-12-18
Converted 'data\edgar_documents\VZ\4_2023-12-26' --> 'data\processed_data\VZ\4_2023-12-26.md'
Converted 'data\edgar_documents\VZ\4_2024-01-08' --> 'data\processed_data\VZ\4_2024-01-08.md'
Converted 'data\edgar_documents\VZ\4_2024-01-22' --> 'data\processed_data\VZ\4_2024-01-22.md'


2025-11-14 17:52:33,895 - INFO - Going to convert document batch...
2025-11-14 17:52:33,896 - INFO - Processing document 4_2024-02-05
2025-11-14 17:52:33,915 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 17:52:33,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:33,956 - INFO - Going to convert document batch...
2025-11-14 17:52:33,957 - INFO - Processing document 4_2024-02-06
2025-11-14 17:52:34,001 - INFO - Finished converting document 4_2024-02-06 in 0.06 sec.
2025-11-14 17:52:34,072 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:34,074 - ERROR - Input document 4_2024-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\VZ\4_2024-02-05' --> 'data\processed_data\VZ\4_2024-02-05.md'
Converted 'data\edgar_documents\VZ\4_2024-02-06' --> 'data\processed_data\VZ\4_2024-02-06.md'
Error processing data\edgar_documents\VZ\4_2024-02-14: File format not allowed: data\edgar_documents\VZ\4_2024-02-14


2025-11-14 17:52:34,121 - INFO - Finished converting document 4_2024-02-16 in 0.05 sec.
2025-11-14 17:52:34,159 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:34,160 - ERROR - Input document 4_2024-02-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:34,161 - INFO - Going to convert document batch...
2025-11-14 17:52:34,178 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:34,179 - ERROR - Input document 4_2024-02-21 with forma

Converted 'data\edgar_documents\VZ\4_2024-02-16' --> 'data\processed_data\VZ\4_2024-02-16.md'
Error processing data\edgar_documents\VZ\4_2024-02-20: File format not allowed: data\edgar_documents\VZ\4_2024-02-20
Error processing data\edgar_documents\VZ\4_2024-02-21: File format not allowed: data\edgar_documents\VZ\4_2024-02-21
Error processing data\edgar_documents\VZ\4_2024-02-26: File format not allowed: data\edgar_documents\VZ\4_2024-02-26
Error processing data\edgar_documents\VZ\4_2024-03-04: File format not allowed: data\edgar_documents\VZ\4_2024-03-04
Converted 'data\edgar_documents\VZ\4_2024-03-05' --> 'data\processed_data\VZ\4_2024-03-05.md'
Error processing data\edgar_documents\VZ\4_2024-03-11: File format not allowed: data\edgar_documents\VZ\4_2024-03-11
Error processing data\edgar_documents\VZ\4_2024-03-18: File format not allowed: data\edgar_documents\VZ\4_2024-03-18
Error processing data\edgar_documents\VZ\4_2024-03-25: File format not allowed: data\edgar_documents\VZ\4_2024

2025-11-14 17:52:34,326 - ERROR - Input document 4_2024-04-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:34,327 - INFO - Going to convert document batch...
2025-11-14 17:52:34,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:34,346 - INFO - Going to convert document batch...
2025-11-14 17:52:34,346 - INFO - Processing document 4_2024-04-15
2025-11-14 17:52:34,366 - INFO - Finished converting document 4_2024-04-15 in 0.03 sec.
2025-11-14 17:52:34,412 - INFO - detec

Error processing data\edgar_documents\VZ\4_2024-04-01: File format not allowed: data\edgar_documents\VZ\4_2024-04-01
Converted 'data\edgar_documents\VZ\4_2024-04-15' --> 'data\processed_data\VZ\4_2024-04-15.md'
Error processing data\edgar_documents\VZ\4_2024-04-29: File format not allowed: data\edgar_documents\VZ\4_2024-04-29
Error processing data\edgar_documents\VZ\4_2024-05-06: File format not allowed: data\edgar_documents\VZ\4_2024-05-06
Error processing data\edgar_documents\VZ\4_2024-05-13: File format not allowed: data\edgar_documents\VZ\4_2024-05-13
Error processing data\edgar_documents\VZ\4_2024-05-20: File format not allowed: data\edgar_documents\VZ\4_2024-05-20
Error processing data\edgar_documents\VZ\4_2024-05-28: File format not allowed: data\edgar_documents\VZ\4_2024-05-28
Converted 'data\edgar_documents\VZ\4_2024-05-29' --> 'data\processed_data\VZ\4_2024-05-29.md'


2025-11-14 17:52:34,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:34,566 - INFO - Going to convert document batch...
2025-11-14 17:52:34,568 - INFO - Processing document 4_2024-05-30
2025-11-14 17:52:34,590 - INFO - Finished converting document 4_2024-05-30 in 0.06 sec.
2025-11-14 17:52:34,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:34,632 - INFO - Going to convert document batch...
2025-11-14 17:52:34,633 - INFO - Processing document 4_2024-05-31
2025-11-14 17:52:34,653 - INFO - Finished converting document 4_2024-05-31 in 0.05 sec.
2025-11-14 17:52:34,702 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:34,703 - ERROR - Input document 4_2024-06-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\VZ\4_2024-05-30' --> 'data\processed_data\VZ\4_2024-05-30.md'
Converted 'data\edgar_documents\VZ\4_2024-05-31' --> 'data\processed_data\VZ\4_2024-05-31.md'
Error processing data\edgar_documents\VZ\4_2024-06-03: File format not allowed: data\edgar_documents\VZ\4_2024-06-03
Converted 'data\edgar_documents\VZ\4_2024-06-04' --> 'data\processed_data\VZ\4_2024-06-04.md'
Error processing data\edgar_documents\VZ\4_2024-06-10: File format not allowed: data\edgar_documents\VZ\4_2024-06-10


2025-11-14 17:52:34,797 - ERROR - Input document 4_2024-06-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:34,797 - INFO - Going to convert document batch...
2025-11-14 17:52:34,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:34,818 - INFO - Going to convert document batch...
2025-11-14 17:52:34,819 - INFO - Processing document 4_2024-06-24
2025-11-14 17:52:34,839 - INFO - Finished converting document 4_2024-06-24 in 0.05 sec.
2025-11-14 17:52:34,877 - INFO - detec

Error processing data\edgar_documents\VZ\4_2024-06-17: File format not allowed: data\edgar_documents\VZ\4_2024-06-17
Converted 'data\edgar_documents\VZ\4_2024-06-24' --> 'data\processed_data\VZ\4_2024-06-24.md'
Converted 'data\edgar_documents\VZ\4_2024-07-03' --> 'data\processed_data\VZ\4_2024-07-03.md'
Converted 'data\edgar_documents\VZ\4_2024-07-08' --> 'data\processed_data\VZ\4_2024-07-08.md'


2025-11-14 17:52:35,003 - INFO - Going to convert document batch...
2025-11-14 17:52:35,003 - INFO - Processing document 4_2024-07-22
2025-11-14 17:52:35,024 - INFO - Finished converting document 4_2024-07-22 in 0.03 sec.
2025-11-14 17:52:35,062 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:35,063 - ERROR - Input document 4_2024-07-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:35,064 - INFO - Going to convert document batch...
2025-11-14 17:52:35,076 - IN

Converted 'data\edgar_documents\VZ\4_2024-07-22' --> 'data\processed_data\VZ\4_2024-07-22.md'
Error processing data\edgar_documents\VZ\4_2024-07-29: File format not allowed: data\edgar_documents\VZ\4_2024-07-29
Error processing data\edgar_documents\VZ\4_2024-08-05: File format not allowed: data\edgar_documents\VZ\4_2024-08-05
Error processing data\edgar_documents\VZ\4_2024-08-06: File format not allowed: data\edgar_documents\VZ\4_2024-08-06
Error processing data\edgar_documents\VZ\4_2024-08-12: File format not allowed: data\edgar_documents\VZ\4_2024-08-12
Error processing data\edgar_documents\VZ\4_2024-08-19: File format not allowed: data\edgar_documents\VZ\4_2024-08-19
Error processing data\edgar_documents\VZ\4_2024-08-26: File format not allowed: data\edgar_documents\VZ\4_2024-08-26
Converted 'data\edgar_documents\VZ\4_2024-09-03' --> 'data\processed_data\VZ\4_2024-09-03.md'
Error processing data\edgar_documents\VZ\4_2024-09-10: File format not allowed: data\edgar_documents\VZ\4_2024

2025-11-14 17:52:35,232 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:35,233 - INFO - Going to convert document batch...
2025-11-14 17:52:35,245 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:35,245 - ERROR - Input document 4_2024-09-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\VZ\4_2024-09-23: File format not allowed: data\edgar_documents\VZ\4_2024-09-23
Error processing data\edgar_documents\VZ\4_2024-09-30: File format not allowed: data\edgar_documents\VZ\4_2024-09-30
Converted 'data\edgar_documents\VZ\4_2024-10-03' --> 'data\processed_data\VZ\4_2024-10-03.md'
Converted 'data\edgar_documents\VZ\4_2024-10-15' --> 'data\processed_data\VZ\4_2024-10-15.md'


2025-11-14 17:52:35,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,446 - INFO - Going to convert document batch...
2025-11-14 17:52:35,447 - INFO - Processing document 4_2024-11-12
2025-11-14 17:52:35,465 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 17:52:35,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,509 - INFO - Going to convert document batch...
2025-11-14 17:52:35,510 - INFO - Processing document 4_2024-11-25
2025-11-14 17:52:35,530 - INFO - Finished converting document 4_2024-11-25 in 0.05 sec.
2025-11-14 17:52:35,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,570 - INFO - Going to convert document batch...
2025-11-14 17:52:35,571 - INFO - Processing document 4_2024-12-09
2025-11-14 17:52:35,592 - INFO - Finished converting document 4_2024-12-09 in 0.05 sec.


Converted 'data\edgar_documents\VZ\4_2024-10-28' --> 'data\processed_data\VZ\4_2024-10-28.md'
Converted 'data\edgar_documents\VZ\4_2024-11-12' --> 'data\processed_data\VZ\4_2024-11-12.md'
Converted 'data\edgar_documents\VZ\4_2024-11-25' --> 'data\processed_data\VZ\4_2024-11-25.md'


2025-11-14 17:52:35,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,630 - INFO - Going to convert document batch...
2025-11-14 17:52:35,630 - INFO - Processing document 4_2024-12-20
2025-11-14 17:52:35,650 - INFO - Finished converting document 4_2024-12-20 in 0.03 sec.
2025-11-14 17:52:35,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,722 - INFO - Going to convert document batch...
2025-11-14 17:52:35,723 - INFO - Processing document 4_2025-01-06
2025-11-14 17:52:35,746 - INFO - Finished converting document 4_2025-01-06 in 0.06 sec.
2025-11-14 17:52:35,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,784 - INFO - Going to convert document batch...
2025-11-14 17:52:35,784 - INFO - Processing document 4_2025-01-17
2025-11-14 17:52:35,804 - INFO - Finished converting document 4_2025-01-17 in 0.03 sec.


Converted 'data\edgar_documents\VZ\4_2024-12-09' --> 'data\processed_data\VZ\4_2024-12-09.md'
Converted 'data\edgar_documents\VZ\4_2024-12-20' --> 'data\processed_data\VZ\4_2024-12-20.md'
Converted 'data\edgar_documents\VZ\4_2025-01-06' --> 'data\processed_data\VZ\4_2025-01-06.md'


2025-11-14 17:52:35,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,847 - INFO - Going to convert document batch...
2025-11-14 17:52:35,848 - INFO - Processing document 4_2025-01-29
2025-11-14 17:52:35,866 - INFO - Finished converting document 4_2025-01-29 in 0.03 sec.
2025-11-14 17:52:35,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:35,941 - INFO - Going to convert document batch...
2025-11-14 17:52:35,942 - INFO - Processing document 4_2025-01-30
2025-11-14 17:52:35,969 - INFO - Finished converting document 4_2025-01-30 in 0.06 sec.
2025-11-14 17:52:36,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,022 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\4_2025-01-17' --> 'data\processed_data\VZ\4_2025-01-17.md'
Converted 'data\edgar_documents\VZ\4_2025-01-29' --> 'data\processed_data\VZ\4_2025-01-29.md'
Converted 'data\edgar_documents\VZ\4_2025-01-30' --> 'data\processed_data\VZ\4_2025-01-30.md'


2025-11-14 17:52:36,024 - INFO - Processing document 4_2025-01-31
2025-11-14 17:52:36,044 - INFO - Finished converting document 4_2025-01-31 in 0.06 sec.
2025-11-14 17:52:36,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,092 - INFO - Going to convert document batch...
2025-11-14 17:52:36,093 - INFO - Processing document 4_2025-02-03
2025-11-14 17:52:36,112 - INFO - Finished converting document 4_2025-02-03 in 0.05 sec.
2025-11-14 17:52:36,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,151 - INFO - Going to convert document batch...
2025-11-14 17:52:36,151 - INFO - Processing document 4_2025-02-05
2025-11-14 17:52:36,168 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:52:36,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,231 - INFO - Going to convert document batch...
2025-11-14 17:52:36,233 - INFO - Processing document 4_2025-02-06


Converted 'data\edgar_documents\VZ\4_2025-01-31' --> 'data\processed_data\VZ\4_2025-01-31.md'
Converted 'data\edgar_documents\VZ\4_2025-02-03' --> 'data\processed_data\VZ\4_2025-02-03.md'
Converted 'data\edgar_documents\VZ\4_2025-02-05' --> 'data\processed_data\VZ\4_2025-02-05.md'


2025-11-14 17:52:36,252 - INFO - Finished converting document 4_2025-02-06 in 0.06 sec.
2025-11-14 17:52:36,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,291 - INFO - Going to convert document batch...
2025-11-14 17:52:36,291 - INFO - Processing document 4_2025-02-14
2025-11-14 17:52:36,323 - INFO - Finished converting document 4_2025-02-14 in 0.06 sec.
2025-11-14 17:52:36,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,376 - INFO - Going to convert document batch...
2025-11-14 17:52:36,377 - INFO - Processing document 4_2025-02-27
2025-11-14 17:52:36,396 - INFO - Finished converting document 4_2025-02-27 in 0.03 sec.
2025-11-14 17:52:36,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,454 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\4_2025-02-06' --> 'data\processed_data\VZ\4_2025-02-06.md'
Converted 'data\edgar_documents\VZ\4_2025-02-14' --> 'data\processed_data\VZ\4_2025-02-14.md'
Converted 'data\edgar_documents\VZ\4_2025-02-27' --> 'data\processed_data\VZ\4_2025-02-27.md'


2025-11-14 17:52:36,455 - INFO - Processing document 4_2025-02-28
2025-11-14 17:52:36,475 - INFO - Finished converting document 4_2025-02-28 in 0.05 sec.
2025-11-14 17:52:36,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,525 - INFO - Going to convert document batch...
2025-11-14 17:52:36,526 - INFO - Processing document 4_2025-03-04
2025-11-14 17:52:36,557 - INFO - Finished converting document 4_2025-03-04 in 0.06 sec.
2025-11-14 17:52:36,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,614 - INFO - Going to convert document batch...
2025-11-14 17:52:36,615 - INFO - Processing document 4_2025-03-14
2025-11-14 17:52:36,633 - INFO - Finished converting document 4_2025-03-14 in 0.05 sec.
2025-11-14 17:52:36,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,672 - INFO - Going to convert document batch...
2025-11-14 17:52:36,672 - INFO - Processing document 4_2025-03-20
2025-11-14 17:52:36,690 - IN

Converted 'data\edgar_documents\VZ\4_2025-02-28' --> 'data\processed_data\VZ\4_2025-02-28.md'
Converted 'data\edgar_documents\VZ\4_2025-03-04' --> 'data\processed_data\VZ\4_2025-03-04.md'
Converted 'data\edgar_documents\VZ\4_2025-03-14' --> 'data\processed_data\VZ\4_2025-03-14.md'


2025-11-14 17:52:36,725 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:36,725 - ERROR - Input document 4_2025-03-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:36,727 - INFO - Going to convert document batch...
2025-11-14 17:52:36,741 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:36,742 - ERROR - Input document 4_2025-03-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\VZ\4_2025-03-20' --> 'data\processed_data\VZ\4_2025-03-20.md'
Error processing data\edgar_documents\VZ\4_2025-03-24: File format not allowed: data\edgar_documents\VZ\4_2025-03-24
Error processing data\edgar_documents\VZ\4_2025-03-26: File format not allowed: data\edgar_documents\VZ\4_2025-03-26
Converted 'data\edgar_documents\VZ\4_2025-03-28' --> 'data\processed_data\VZ\4_2025-03-28.md'
Error processing data\edgar_documents\VZ\4_2025-04-08: File format not allowed: data\edgar_documents\VZ\4_2025-04-08


2025-11-14 17:52:36,895 - INFO - Finished converting document 4_2025-04-11 in 0.05 sec.
2025-11-14 17:52:36,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,935 - INFO - Going to convert document batch...
2025-11-14 17:52:36,936 - INFO - Processing document 4_2025-04-24
2025-11-14 17:52:36,955 - INFO - Finished converting document 4_2025-04-24 in 0.03 sec.
2025-11-14 17:52:36,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:36,998 - INFO - Going to convert document batch...
2025-11-14 17:52:36,999 - INFO - Processing document 4_2025-04-25
2025-11-14 17:52:37,018 - INFO - Finished converting document 4_2025-04-25 in 0.05 sec.
2025-11-14 17:52:37,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,061 - INFO - Going to convert document batch...
2025-11-14 17:52:37,062 - INFO - Processing document 4_2025-05-01
2025-11-14 17:52:37,082 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-1

Converted 'data\edgar_documents\VZ\4_2025-04-11' --> 'data\processed_data\VZ\4_2025-04-11.md'
Converted 'data\edgar_documents\VZ\4_2025-04-24' --> 'data\processed_data\VZ\4_2025-04-24.md'
Converted 'data\edgar_documents\VZ\4_2025-04-25' --> 'data\processed_data\VZ\4_2025-04-25.md'
Converted 'data\edgar_documents\VZ\4_2025-05-01' --> 'data\processed_data\VZ\4_2025-05-01.md'


2025-11-14 17:52:37,120 - INFO - Going to convert document batch...
2025-11-14 17:52:37,120 - INFO - Processing document 4_2025-05-08
2025-11-14 17:52:37,139 - INFO - Finished converting document 4_2025-05-08 in 0.05 sec.
2025-11-14 17:52:37,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,182 - INFO - Going to convert document batch...
2025-11-14 17:52:37,183 - INFO - Processing document 4_2025-05-09
2025-11-14 17:52:37,205 - INFO - Finished converting document 4_2025-05-09 in 0.05 sec.
2025-11-14 17:52:37,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,244 - INFO - Going to convert document batch...
2025-11-14 17:52:37,245 - INFO - Processing document 4_2025-05-23
2025-11-14 17:52:37,262 - INFO - Finished converting document 4_2025-05-23 in 0.05 sec.
2025-11-14 17:52:37,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,304 - INFO - Going to convert document batch...
2025-11-14 17:52:37,305 - 

Converted 'data\edgar_documents\VZ\4_2025-05-08' --> 'data\processed_data\VZ\4_2025-05-08.md'
Converted 'data\edgar_documents\VZ\4_2025-05-09' --> 'data\processed_data\VZ\4_2025-05-09.md'
Converted 'data\edgar_documents\VZ\4_2025-05-23' --> 'data\processed_data\VZ\4_2025-05-23.md'


2025-11-14 17:52:37,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,368 - INFO - Going to convert document batch...
2025-11-14 17:52:37,369 - INFO - Processing document 4_2025-06-09
2025-11-14 17:52:37,389 - INFO - Finished converting document 4_2025-06-09 in 0.05 sec.
2025-11-14 17:52:37,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,432 - INFO - Going to convert document batch...
2025-11-14 17:52:37,432 - INFO - Processing document 4_2025-06-20
2025-11-14 17:52:37,462 - INFO - Finished converting document 4_2025-06-20 in 0.05 sec.
2025-11-14 17:52:37,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,516 - INFO - Going to convert document batch...
2025-11-14 17:52:37,517 - INFO - Processing document 4_2025-07-07


Converted 'data\edgar_documents\VZ\4_2025-05-28' --> 'data\processed_data\VZ\4_2025-05-28.md'
Converted 'data\edgar_documents\VZ\4_2025-06-09' --> 'data\processed_data\VZ\4_2025-06-09.md'
Converted 'data\edgar_documents\VZ\4_2025-06-20' --> 'data\processed_data\VZ\4_2025-06-20.md'


2025-11-14 17:52:37,540 - INFO - Finished converting document 4_2025-07-07 in 0.05 sec.
2025-11-14 17:52:37,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,581 - INFO - Going to convert document batch...
2025-11-14 17:52:37,581 - INFO - Processing document 4_2025-07-18
2025-11-14 17:52:37,603 - INFO - Finished converting document 4_2025-07-18 in 0.03 sec.
2025-11-14 17:52:37,647 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:37,648 - ERROR - Input document 4_2025-07-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\VZ\4_2025-07-07' --> 'data\processed_data\VZ\4_2025-07-07.md'
Converted 'data\edgar_documents\VZ\4_2025-07-18' --> 'data\processed_data\VZ\4_2025-07-18.md'
Error processing data\edgar_documents\VZ\4_2025-07-30: File format not allowed: data\edgar_documents\VZ\4_2025-07-30
Converted 'data\edgar_documents\VZ\4_2025-08-01' --> 'data\processed_data\VZ\4_2025-08-01.md'


2025-11-14 17:52:37,760 - INFO - Going to convert document batch...
2025-11-14 17:52:37,761 - INFO - Processing document 4_2025-08-15
2025-11-14 17:52:37,783 - INFO - Finished converting document 4_2025-08-15 in 0.06 sec.
2025-11-14 17:52:37,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,845 - INFO - Going to convert document batch...
2025-11-14 17:52:37,847 - INFO - Processing document 4_2025-08-20
2025-11-14 17:52:37,876 - INFO - Finished converting document 4_2025-08-20 in 0.06 sec.
2025-11-14 17:52:37,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,931 - INFO - Going to convert document batch...
2025-11-14 17:52:37,932 - INFO - Processing document 4_2025-08-26
2025-11-14 17:52:37,955 - INFO - Finished converting document 4_2025-08-26 in 0.05 sec.
2025-11-14 17:52:37,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:37,998 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\4_2025-08-15' --> 'data\processed_data\VZ\4_2025-08-15.md'
Converted 'data\edgar_documents\VZ\4_2025-08-20' --> 'data\processed_data\VZ\4_2025-08-20.md'
Converted 'data\edgar_documents\VZ\4_2025-08-26' --> 'data\processed_data\VZ\4_2025-08-26.md'


2025-11-14 17:52:37,999 - INFO - Processing document 4_2025-08-29
2025-11-14 17:52:38,019 - INFO - Finished converting document 4_2025-08-29 in 0.03 sec.
2025-11-14 17:52:38,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,064 - INFO - Going to convert document batch...
2025-11-14 17:52:38,064 - INFO - Processing document 4_2025-09-12
2025-11-14 17:52:38,085 - INFO - Finished converting document 4_2025-09-12 in 0.03 sec.
2025-11-14 17:52:38,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,131 - INFO - Going to convert document batch...
2025-11-14 17:52:38,132 - INFO - Processing document 4_2025-09-26
2025-11-14 17:52:38,155 - INFO - Finished converting document 4_2025-09-26 in 0.05 sec.
2025-11-14 17:52:38,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,202 - INFO - Going to convert document batch...
2025-11-14 17:52:38,203 - INFO - Processing document 4_2025-10-10
2025-11-14 17:52:38,222 - IN

Converted 'data\edgar_documents\VZ\4_2025-08-29' --> 'data\processed_data\VZ\4_2025-08-29.md'
Converted 'data\edgar_documents\VZ\4_2025-09-12' --> 'data\processed_data\VZ\4_2025-09-12.md'
Converted 'data\edgar_documents\VZ\4_2025-09-26' --> 'data\processed_data\VZ\4_2025-09-26.md'


2025-11-14 17:52:38,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,262 - INFO - Going to convert document batch...
2025-11-14 17:52:38,263 - INFO - Processing document 4_2025-10-20
2025-11-14 17:52:38,282 - INFO - Finished converting document 4_2025-10-20 in 0.05 sec.
2025-11-14 17:52:38,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,326 - INFO - Going to convert document batch...
2025-11-14 17:52:38,327 - INFO - Processing document 4_2025-10-21
2025-11-14 17:52:38,551 - INFO - Finished converting document 4_2025-10-21 in 0.25 sec.


Converted 'data\edgar_documents\VZ\4_2025-10-10' --> 'data\processed_data\VZ\4_2025-10-10.md'
Converted 'data\edgar_documents\VZ\4_2025-10-20' --> 'data\processed_data\VZ\4_2025-10-20.md'


2025-11-14 17:52:38,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,609 - INFO - Going to convert document batch...
2025-11-14 17:52:38,610 - INFO - Processing document 4_2025-10-24
2025-11-14 17:52:38,630 - INFO - Finished converting document 4_2025-10-24 in 0.05 sec.
2025-11-14 17:52:38,677 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:38,678 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52

Converted 'data\edgar_documents\VZ\4_2025-10-21' --> 'data\processed_data\VZ\4_2025-10-21.md'
Converted 'data\edgar_documents\VZ\4_2025-10-24' --> 'data\processed_data\VZ\4_2025-10-24.md'
Error processing data\edgar_documents\VZ\4_2025-11-03: File format not allowed: data\edgar_documents\VZ\4_2025-11-03
Error processing data\edgar_documents\VZ\4_2025-11-06: File format not allowed: data\edgar_documents\VZ\4_2025-11-06


2025-11-14 17:52:38,810 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:38,811 - ERROR - Input document 4_2025-11-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:38,813 - INFO - Going to convert document batch...
2025-11-14 17:52:38,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:38,869 - INFO - Going to convert document batch...
2025-11-14 17:52:38,869 - INFO - Processing document 8-K_2023-01-24
2025-11-14 17:52:38,924 - INFO - F

Converted 'data\edgar_documents\VZ\4_2025-11-07' --> 'data\processed_data\VZ\4_2025-11-07.md'
Error processing data\edgar_documents\VZ\4_2025-11-10: File format not allowed: data\edgar_documents\VZ\4_2025-11-10
Converted 'data\edgar_documents\VZ\8-K_2023-01-24' --> 'data\processed_data\VZ\8-K_2023-01-24.md'


2025-11-14 17:52:38,992 - INFO - Processing document 8-K_2023-03-03
2025-11-14 17:52:39,025 - INFO - Finished converting document 8-K_2023-03-03 in 0.06 sec.
2025-11-14 17:52:39,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,086 - INFO - Going to convert document batch...
2025-11-14 17:52:39,087 - INFO - Processing document 8-K_2023-04-25
2025-11-14 17:52:39,157 - INFO - Finished converting document 8-K_2023-04-25 in 0.12 sec.
2025-11-14 17:52:39,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,227 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\8-K_2023-03-03' --> 'data\processed_data\VZ\8-K_2023-03-03.md'
Converted 'data\edgar_documents\VZ\8-K_2023-04-25' --> 'data\processed_data\VZ\8-K_2023-04-25.md'


2025-11-14 17:52:39,228 - INFO - Processing document 8-K_2023-05-16
2025-11-14 17:52:39,279 - INFO - Finished converting document 8-K_2023-05-16 in 0.09 sec.
2025-11-14 17:52:39,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,345 - INFO - Going to convert document batch...
2025-11-14 17:52:39,346 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:52:39,390 - INFO - Finished converting document 8-K_2023-07-25 in 0.09 sec.
2025-11-14 17:52:39,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,452 - INFO - Going to convert document batch...
2025-11-14 17:52:39,453 - INFO - Processing document 8-K_2023-08-10
2025-11-14 17:52:39,483 - INFO - Finished converting document 8-K_2023-08-10 in 0.08 sec.


Converted 'data\edgar_documents\VZ\8-K_2023-05-16' --> 'data\processed_data\VZ\8-K_2023-05-16.md'
Converted 'data\edgar_documents\VZ\8-K_2023-07-25' --> 'data\processed_data\VZ\8-K_2023-07-25.md'


2025-11-14 17:52:39,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,538 - INFO - Going to convert document batch...
2025-11-14 17:52:39,539 - INFO - Processing document 8-K_2023-10-24
2025-11-14 17:52:39,583 - INFO - Finished converting document 8-K_2023-10-24 in 0.08 sec.
2025-11-14 17:52:39,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,645 - INFO - Going to convert document batch...
2025-11-14 17:52:39,646 - INFO - Processing document 8-K_2024-01-17
2025-11-14 17:52:39,677 - INFO - Finished converting document 8-K_2024-01-17 in 0.06 sec.
2025-11-14 17:52:39,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2023-08-10' --> 'data\processed_data\VZ\8-K_2023-08-10.md'
Converted 'data\edgar_documents\VZ\8-K_2023-10-24' --> 'data\processed_data\VZ\8-K_2023-10-24.md'
Converted 'data\edgar_documents\VZ\8-K_2024-01-17' --> 'data\processed_data\VZ\8-K_2024-01-17.md'


2025-11-14 17:52:39,733 - INFO - Going to convert document batch...
2025-11-14 17:52:39,734 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:52:39,776 - INFO - Finished converting document 8-K_2024-01-23 in 0.09 sec.
2025-11-14 17:52:39,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,838 - INFO - Going to convert document batch...
2025-11-14 17:52:39,839 - INFO - Processing document 8-K_2024-01-24
2025-11-14 17:52:39,898 - INFO - Finished converting document 8-K_2024-01-24 in 0.09 sec.
2025-11-14 17:52:39,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:39,982 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\8-K_2024-01-23' --> 'data\processed_data\VZ\8-K_2024-01-23.md'
Converted 'data\edgar_documents\VZ\8-K_2024-01-24' --> 'data\processed_data\VZ\8-K_2024-01-24.md'


2025-11-14 17:52:39,983 - INFO - Processing document 8-K_2024-02-02
2025-11-14 17:52:40,015 - INFO - Finished converting document 8-K_2024-02-02 in 0.09 sec.
2025-11-14 17:52:40,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,063 - INFO - Going to convert document batch...
2025-11-14 17:52:40,064 - INFO - Processing document 8-K_2024-03-06
2025-11-14 17:52:40,097 - INFO - Finished converting document 8-K_2024-03-06 in 0.06 sec.
2025-11-14 17:52:40,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,180 - INFO - Going to convert document batch...
2025-11-14 17:52:40,182 - INFO - Processing document 8-K_2024-04-22
2025-11-14 17:52:40,222 - INFO - Finished converting document 8-K_2024-04-22 in 0.11 sec.


Converted 'data\edgar_documents\VZ\8-K_2024-02-02' --> 'data\processed_data\VZ\8-K_2024-02-02.md'
Converted 'data\edgar_documents\VZ\8-K_2024-03-06' --> 'data\processed_data\VZ\8-K_2024-03-06.md'


2025-11-14 17:52:40,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,290 - INFO - Going to convert document batch...
2025-11-14 17:52:40,291 - INFO - Processing document 8-K_2024-05-13
2025-11-14 17:52:40,333 - INFO - Finished converting document 8-K_2024-05-13 in 0.09 sec.
2025-11-14 17:52:40,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,406 - INFO - Going to convert document batch...
2025-11-14 17:52:40,408 - INFO - Processing document 8-K_2024-05-23
2025-11-14 17:52:40,451 - INFO - Finished converting document 8-K_2024-05-23 in 0.11 sec.


Converted 'data\edgar_documents\VZ\8-K_2024-04-22' --> 'data\processed_data\VZ\8-K_2024-04-22.md'
Converted 'data\edgar_documents\VZ\8-K_2024-05-13' --> 'data\processed_data\VZ\8-K_2024-05-13.md'


2025-11-14 17:52:40,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,500 - INFO - Going to convert document batch...
2025-11-14 17:52:40,500 - INFO - Processing document 8-K_2024-06-27
2025-11-14 17:52:40,533 - INFO - Finished converting document 8-K_2024-06-27 in 0.08 sec.
2025-11-14 17:52:40,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,605 - INFO - Going to convert document batch...
2025-11-14 17:52:40,606 - INFO - Processing document 8-K_2024-07-22
2025-11-14 17:52:40,644 - INFO - Finished converting document 8-K_2024-07-22 in 0.09 sec.


Converted 'data\edgar_documents\VZ\8-K_2024-05-23' --> 'data\processed_data\VZ\8-K_2024-05-23.md'
Converted 'data\edgar_documents\VZ\8-K_2024-06-27' --> 'data\processed_data\VZ\8-K_2024-06-27.md'


2025-11-14 17:52:40,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,694 - INFO - Going to convert document batch...
2025-11-14 17:52:40,695 - INFO - Processing document 8-K_2024-07-31
2025-11-14 17:52:40,729 - INFO - Finished converting document 8-K_2024-07-31 in 0.08 sec.
2025-11-14 17:52:40,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,780 - INFO - Going to convert document batch...
2025-11-14 17:52:40,781 - INFO - Processing document 8-K_2024-08-05
2025-11-14 17:52:40,810 - INFO - Finished converting document 8-K_2024-08-05 in 0.08 sec.
2025-11-14 17:52:40,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2024-07-22' --> 'data\processed_data\VZ\8-K_2024-07-22.md'
Converted 'data\edgar_documents\VZ\8-K_2024-07-31' --> 'data\processed_data\VZ\8-K_2024-07-31.md'
Converted 'data\edgar_documents\VZ\8-K_2024-08-05' --> 'data\processed_data\VZ\8-K_2024-08-05.md'


2025-11-14 17:52:40,862 - INFO - Going to convert document batch...
2025-11-14 17:52:40,862 - INFO - Processing document 8-K_2024-08-20
2025-11-14 17:52:40,892 - INFO - Finished converting document 8-K_2024-08-20 in 0.06 sec.
2025-11-14 17:52:40,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:40,945 - INFO - Going to convert document batch...
2025-11-14 17:52:40,946 - INFO - Processing document 8-K_2024-09-05
2025-11-14 17:52:40,994 - INFO - Finished converting document 8-K_2024-09-05 in 0.08 sec.
2025-11-14 17:52:41,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2024-08-20' --> 'data\processed_data\VZ\8-K_2024-08-20.md'
Converted 'data\edgar_documents\VZ\8-K_2024-09-05' --> 'data\processed_data\VZ\8-K_2024-09-05.md'


2025-11-14 17:52:41,271 - INFO - Going to convert document batch...
2025-11-14 17:52:41,272 - INFO - Processing document 8-K_2024-09-09
2025-11-14 17:52:41,307 - INFO - Finished converting document 8-K_2024-09-09 in 0.30 sec.
2025-11-14 17:52:41,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,359 - INFO - Going to convert document batch...
2025-11-14 17:52:41,361 - INFO - Processing document 8-K_2024-09-12
2025-11-14 17:52:41,392 - INFO - Finished converting document 8-K_2024-09-12 in 0.06 sec.
2025-11-14 17:52:41,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,447 - INFO - Going to convert document batch...
2025-11-14 17:52:41,448 - INFO - Processing document 8-K_2024-09-30
2025-11-14 17:52:41,480 - INFO - Finished converting document 8-K_2024-09-30 in 0.08 sec.
2025-11-14 17:52:41,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,529 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\8-K_2024-09-09' --> 'data\processed_data\VZ\8-K_2024-09-09.md'
Converted 'data\edgar_documents\VZ\8-K_2024-09-12' --> 'data\processed_data\VZ\8-K_2024-09-12.md'
Converted 'data\edgar_documents\VZ\8-K_2024-09-30' --> 'data\processed_data\VZ\8-K_2024-09-30.md'


2025-11-14 17:52:41,530 - INFO - Processing document 8-K_2024-10-22
2025-11-14 17:52:41,568 - INFO - Finished converting document 8-K_2024-10-22 in 0.08 sec.
2025-11-14 17:52:41,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,632 - INFO - Going to convert document batch...
2025-11-14 17:52:41,632 - INFO - Processing document 8-K_2024-12-06
2025-11-14 17:52:41,668 - INFO - Finished converting document 8-K_2024-12-06 in 0.08 sec.
2025-11-14 17:52:41,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,738 - INFO - Going to convert document batch...
2025-11-14 17:52:41,739 - INFO - Processing document 8-K_2025-01-24
2025-11-14 17:52:41,785 - INFO - Finished converting document 8-K_2025-01-24 in 0.11 sec.


Converted 'data\edgar_documents\VZ\8-K_2024-10-22' --> 'data\processed_data\VZ\8-K_2024-10-22.md'
Converted 'data\edgar_documents\VZ\8-K_2024-12-06' --> 'data\processed_data\VZ\8-K_2024-12-06.md'


2025-11-14 17:52:41,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,847 - INFO - Going to convert document batch...
2025-11-14 17:52:41,848 - INFO - Processing document 8-K_2025-02-10
2025-11-14 17:52:41,881 - INFO - Finished converting document 8-K_2025-02-10 in 0.06 sec.
2025-11-14 17:52:41,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:41,930 - INFO - Going to convert document batch...
2025-11-14 17:52:41,931 - INFO - Processing document 8-K_2025-03-11
2025-11-14 17:52:41,966 - INFO - Finished converting document 8-K_2025-03-11 in 0.08 sec.
2025-11-14 17:52:41,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2025-01-24' --> 'data\processed_data\VZ\8-K_2025-01-24.md'
Converted 'data\edgar_documents\VZ\8-K_2025-02-10' --> 'data\processed_data\VZ\8-K_2025-02-10.md'
Converted 'data\edgar_documents\VZ\8-K_2025-03-11' --> 'data\processed_data\VZ\8-K_2025-03-11.md'


2025-11-14 17:52:42,021 - INFO - Going to convert document batch...
2025-11-14 17:52:42,022 - INFO - Processing document 8-K_2025-03-19
2025-11-14 17:52:42,082 - INFO - Finished converting document 8-K_2025-03-19 in 0.09 sec.
2025-11-14 17:52:42,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,154 - INFO - Going to convert document batch...
2025-11-14 17:52:42,155 - INFO - Processing document 8-K_2025-04-22
2025-11-14 17:52:42,210 - INFO - Finished converting document 8-K_2025-04-22 in 0.09 sec.
2025-11-14 17:52:42,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,279 - INFO - Going to convert document batch...
2025-11-14 17:52:42,280 - INFO - Processing document 8-K_2025-05-28


Converted 'data\edgar_documents\VZ\8-K_2025-03-19' --> 'data\processed_data\VZ\8-K_2025-03-19.md'
Converted 'data\edgar_documents\VZ\8-K_2025-04-22' --> 'data\processed_data\VZ\8-K_2025-04-22.md'


2025-11-14 17:52:42,322 - INFO - Finished converting document 8-K_2025-05-28 in 0.08 sec.
2025-11-14 17:52:42,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,375 - INFO - Going to convert document batch...
2025-11-14 17:52:42,376 - INFO - Processing document 8-K_2025-06-12
2025-11-14 17:52:42,409 - INFO - Finished converting document 8-K_2025-06-12 in 0.08 sec.
2025-11-14 17:52:42,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,462 - INFO - Going to convert document batch...
2025-11-14 17:52:42,463 - INFO - Processing document 8-K_2025-06-18
2025-11-14 17:52:42,498 - INFO - Finished converting document 8-K_2025-06-18 in 0.08 sec.
2025-11-14 17:52:42,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2025-05-28' --> 'data\processed_data\VZ\8-K_2025-05-28.md'
Converted 'data\edgar_documents\VZ\8-K_2025-06-12' --> 'data\processed_data\VZ\8-K_2025-06-12.md'
Converted 'data\edgar_documents\VZ\8-K_2025-06-18' --> 'data\processed_data\VZ\8-K_2025-06-18.md'


2025-11-14 17:52:42,548 - INFO - Going to convert document batch...
2025-11-14 17:52:42,549 - INFO - Processing document 8-K_2025-06-20
2025-11-14 17:52:42,587 - INFO - Finished converting document 8-K_2025-06-20 in 0.06 sec.
2025-11-14 17:52:42,617 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,668 - INFO - Going to convert document batch...
2025-11-14 17:52:42,671 - INFO - Processing document 8-K_2025-06-23
2025-11-14 17:52:42,708 - INFO - Finished converting document 8-K_2025-06-23 in 0.11 sec.
2025-11-14 17:52:42,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,791 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\VZ\8-K_2025-06-20' --> 'data\processed_data\VZ\8-K_2025-06-20.md'
Converted 'data\edgar_documents\VZ\8-K_2025-06-23' --> 'data\processed_data\VZ\8-K_2025-06-23.md'


2025-11-14 17:52:42,793 - INFO - Processing document 8-K_2025-06-27
2025-11-14 17:52:42,826 - INFO - Finished converting document 8-K_2025-06-27 in 0.11 sec.
2025-11-14 17:52:42,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:42,889 - INFO - Going to convert document batch...
2025-11-14 17:52:42,891 - INFO - Processing document 8-K_2025-07-21
2025-11-14 17:52:42,938 - INFO - Finished converting document 8-K_2025-07-21 in 0.09 sec.
2025-11-14 17:52:42,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:43,002 - INFO - Going to convert document batch...
2025-11-14 17:52:43,003 - INFO - Processing document 8-K_2025-08-25
2025-11-14 17:52:43,036 - INFO - Finished converting document 8-K_2025-08-25 in 0.08 sec.


Converted 'data\edgar_documents\VZ\8-K_2025-06-27' --> 'data\processed_data\VZ\8-K_2025-06-27.md'
Converted 'data\edgar_documents\VZ\8-K_2025-07-21' --> 'data\processed_data\VZ\8-K_2025-07-21.md'


2025-11-14 17:52:43,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:43,089 - INFO - Going to convert document batch...
2025-11-14 17:52:43,090 - INFO - Processing document 8-K_2025-10-06
2025-11-14 17:52:43,126 - INFO - Finished converting document 8-K_2025-10-06 in 0.08 sec.
2025-11-14 17:52:43,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:43,181 - INFO - Going to convert document batch...
2025-11-14 17:52:43,182 - INFO - Processing document 8-K_2025-10-14
2025-11-14 17:52:43,216 - INFO - Finished converting document 8-K_2025-10-14 in 0.08 sec.


Converted 'data\edgar_documents\VZ\8-K_2025-08-25' --> 'data\processed_data\VZ\8-K_2025-08-25.md'
Converted 'data\edgar_documents\VZ\8-K_2025-10-06' --> 'data\processed_data\VZ\8-K_2025-10-06.md'


2025-11-14 17:52:43,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:52:43,270 - INFO - Going to convert document batch...
2025-11-14 17:52:43,271 - INFO - Processing document 8-K_2025-10-29
2025-11-14 17:52:43,345 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 17:52:43,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\8-K_2025-10-14' --> 'data\processed_data\VZ\8-K_2025-10-14.md'
Converted 'data\edgar_documents\VZ\8-K_2025-10-29' --> 'data\processed_data\VZ\8-K_2025-10-29.md'


2025-11-14 17:52:43,458 - INFO - Going to convert document batch...
2025-11-14 17:52:43,459 - INFO - Processing document 8-K_2025-11-10
2025-11-14 17:52:43,509 - INFO - Finished converting document 8-K_2025-11-10 in 0.11 sec.
2025-11-14 17:52:43,582 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:52:43,582 - ERROR - Input document DEF-14A_2023-03-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:52:43,586 - INFO - Going to convert 

Converted 'data\edgar_documents\VZ\8-K_2025-11-10' --> 'data\processed_data\VZ\8-K_2025-11-10.md'
Error processing data\edgar_documents\VZ\DEF-14A_2023-03-27: File format not allowed: data\edgar_documents\VZ\DEF-14A_2023-03-27


2025-11-14 17:52:44,380 - INFO - Going to convert document batch...
2025-11-14 17:52:44,381 - INFO - Processing document DEF-14A_2024-03-25
2025-11-14 17:52:46,230 - INFO - Finished converting document DEF-14A_2024-03-25 in 2.66 sec.
2025-11-14 17:52:47,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\DEF-14A_2024-03-25' --> 'data\processed_data\VZ\DEF-14A_2024-03-25.md'


2025-11-14 17:52:47,868 - INFO - Going to convert document batch...
2025-11-14 17:52:47,869 - INFO - Processing document DEF-14A_2025-04-07
2025-11-14 17:53:04,866 - INFO - Finished converting document DEF-14A_2025-04-07 in 17.58 sec.
2025-11-14 17:53:05,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\VZ\DEF-14A_2025-04-07' --> 'data\processed_data\VZ\DEF-14A_2025-04-07.md'
Processed 146 new files. Errors: 67
Found 323 files to process in data\edgar_documents\WFC


2025-11-14 17:53:06,904 - INFO - Going to convert document batch...
2025-11-14 17:53:06,905 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:53:06,906 - INFO - Processing document 10-K_2023-02-21
2025-11-14 17:53:07,550 - INFO - Finished converting document 10-K_2023-02-21 in 1.66 sec.
2025-11-14 17:53:08,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\10-K_2023-02-21' --> 'data\processed_data\WFC\10-K_2023-02-21.md'


2025-11-14 17:53:08,552 - INFO - Going to convert document batch...
2025-11-14 17:53:08,553 - INFO - Processing document 10-K_2024-02-20
2025-11-14 17:53:09,364 - INFO - Finished converting document 10-K_2024-02-20 in 1.34 sec.
2025-11-14 17:53:09,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\10-K_2024-02-20' --> 'data\processed_data\WFC\10-K_2024-02-20.md'


2025-11-14 17:53:10,259 - INFO - Going to convert document batch...
2025-11-14 17:53:10,260 - INFO - Processing document 10-K_2025-02-25
2025-11-14 17:53:10,770 - INFO - Finished converting document 10-K_2025-02-25 in 0.98 sec.


Converted 'data\edgar_documents\WFC\10-K_2025-02-25' --> 'data\processed_data\WFC\10-K_2025-02-25.md'


2025-11-14 17:53:11,456 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:53:14,780 - INFO - Going to convert document batch...
2025-11-14 17:53:14,780 - INFO - Processing document 10-Q_2023-05-02
2025-11-14 17:53:20,565 - INFO - Finished converting document 10-Q_2023-05-02 in 9.33 sec.


Converted 'data\edgar_documents\WFC\10-Q_2023-05-02' --> 'data\processed_data\WFC\10-Q_2023-05-02.md'


2025-11-14 17:53:23,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:53:26,944 - INFO - Going to convert document batch...
2025-11-14 17:53:26,944 - INFO - Processing document 10-Q_2023-08-01
2025-11-14 17:53:35,653 - INFO - Finished converting document 10-Q_2023-08-01 in 12.88 sec.
2025-11-14 17:53:38,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:53:38,526 - INFO - Going to convert document batch...
2025-11-14 17:53:38,527 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 17:53:38,556 - INFO - Finished converting document 10-Q_2023-08-04 in 0.06 sec.


Converted 'data\edgar_documents\WFC\10-Q_2023-08-01' --> 'data\processed_data\WFC\10-Q_2023-08-01.md'
Converted 'data\edgar_documents\WFC\10-Q_2023-08-04' --> 'data\processed_data\WFC\10-Q_2023-08-04.md'


2025-11-14 17:53:38,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:53:43,132 - INFO - Going to convert document batch...
2025-11-14 17:53:43,133 - INFO - Processing document 10-Q_2023-10-31
2025-11-14 17:53:50,947 - INFO - Finished converting document 10-Q_2023-10-31 in 12.33 sec.
2025-11-14 17:53:54,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\10-Q_2023-10-31' --> 'data\processed_data\WFC\10-Q_2023-10-31.md'


2025-11-14 17:53:56,987 - INFO - Going to convert document batch...
2025-11-14 17:53:56,988 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 17:54:02,419 - INFO - Finished converting document 10-Q_2024-05-02 in 8.38 sec.


Converted 'data\edgar_documents\WFC\10-Q_2024-05-02' --> 'data\processed_data\WFC\10-Q_2024-05-02.md'


2025-11-14 17:54:04,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:54:08,962 - INFO - Going to convert document batch...
2025-11-14 17:54:08,963 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 17:54:16,602 - INFO - Finished converting document 10-Q_2024-08-01 in 12.00 sec.


Converted 'data\edgar_documents\WFC\10-Q_2024-08-01' --> 'data\processed_data\WFC\10-Q_2024-08-01.md'


2025-11-14 17:54:19,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:54:22,917 - INFO - Going to convert document batch...
2025-11-14 17:54:22,918 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 17:54:29,946 - INFO - Finished converting document 10-Q_2024-10-31 in 10.86 sec.
2025-11-14 17:54:33,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\10-Q_2024-10-31' --> 'data\processed_data\WFC\10-Q_2024-10-31.md'


2025-11-14 17:54:36,377 - INFO - Going to convert document batch...
2025-11-14 17:54:36,377 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 17:54:41,799 - INFO - Finished converting document 10-Q_2025-04-29 in 8.28 sec.


Converted 'data\edgar_documents\WFC\10-Q_2025-04-29' --> 'data\processed_data\WFC\10-Q_2025-04-29.md'


2025-11-14 17:54:45,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:54:48,064 - INFO - Going to convert document batch...
2025-11-14 17:54:48,065 - INFO - Processing document 10-Q_2025-08-05
2025-11-14 17:54:55,429 - INFO - Finished converting document 10-Q_2025-08-05 in 10.50 sec.


Converted 'data\edgar_documents\WFC\10-Q_2025-08-05' --> 'data\processed_data\WFC\10-Q_2025-08-05.md'


2025-11-14 17:54:58,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:01,519 - INFO - Going to convert document batch...
2025-11-14 17:55:01,520 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 17:55:08,797 - INFO - Finished converting document 10-Q_2025-10-31 in 11.03 sec.
2025-11-14 17:55:11,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:11,144 - INFO - Going to convert document batch...
2025-11-14 17:55:11,145 - INFO - Processing document 4_2023-01-04
2025-11-14 17:55:11,163 - INFO - Finished converting document 4_2023-01-04 in 0.03 sec.
2025-11-14 17:55:11,226 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:11,227 - ERROR - Input document 4_2023-01-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'

Converted 'data\edgar_documents\WFC\10-Q_2025-10-31' --> 'data\processed_data\WFC\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\WFC\4_2023-01-04' --> 'data\processed_data\WFC\4_2023-01-04.md'
Error processing data\edgar_documents\WFC\4_2023-01-17: File format not allowed: data\edgar_documents\WFC\4_2023-01-17
Converted 'data\edgar_documents\WFC\4_2023-01-18' --> 'data\processed_data\WFC\4_2023-01-18.md'


2025-11-14 17:55:11,324 - ERROR - Input document 4_2023-01-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:11,326 - INFO - Going to convert document batch...
2025-11-14 17:55:11,346 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:11,347 - ERROR - Input document 4_2023-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2023-01-23: File format not allowed: data\edgar_documents\WFC\4_2023-01-23
Error processing data\edgar_documents\WFC\4_2023-01-24: File format not allowed: data\edgar_documents\WFC\4_2023-01-24
Converted 'data\edgar_documents\WFC\4_2023-01-26' --> 'data\processed_data\WFC\4_2023-01-26.md'
Error processing data\edgar_documents\WFC\4_2023-01-30: File format not allowed: data\edgar_documents\WFC\4_2023-01-30
Converted 'data\edgar_documents\WFC\4_2023-01-31' --> 'data\processed_data\WFC\4_2023-01-31.md'


2025-11-14 17:55:11,526 - ERROR - Input document 4_2023-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:11,529 - INFO - Going to convert document batch...
2025-11-14 17:55:11,550 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:11,551 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2023-02-06: File format not allowed: data\edgar_documents\WFC\4_2023-02-06
Error processing data\edgar_documents\WFC\4_2023-02-07: File format not allowed: data\edgar_documents\WFC\4_2023-02-07
Error processing data\edgar_documents\WFC\4_2023-02-15: File format not allowed: data\edgar_documents\WFC\4_2023-02-15
Error processing data\edgar_documents\WFC\4_2023-02-16: File format not allowed: data\edgar_documents\WFC\4_2023-02-16
Error processing data\edgar_documents\WFC\4_2023-02-17: File format not allowed: data\edgar_documents\WFC\4_2023-02-17
Error processing data\edgar_documents\WFC\4_2023-02-24: File format not allowed: data\edgar_documents\WFC\4_2023-02-24
Converted 'data\edgar_documents\WFC\4_2023-02-27' --> 'data\processed_data\WFC\4_2023-02-27.md'


2025-11-14 17:55:11,716 - ERROR - Input document 4_2023-02-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:11,717 - INFO - Going to convert document batch...
2025-11-14 17:55:11,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:11,739 - INFO - Going to convert document batch...
2025-11-14 17:55:11,740 - INFO - Processing document 4_2023-03-01
2025-11-14 17:55:11,760 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 17:55:11,810 - INFO - detec

Error processing data\edgar_documents\WFC\4_2023-02-28: File format not allowed: data\edgar_documents\WFC\4_2023-02-28
Converted 'data\edgar_documents\WFC\4_2023-03-01' --> 'data\processed_data\WFC\4_2023-03-01.md'
Converted 'data\edgar_documents\WFC\4_2023-03-03' --> 'data\processed_data\WFC\4_2023-03-03.md'
Error processing data\edgar_documents\WFC\4_2023-03-09: File format not allowed: data\edgar_documents\WFC\4_2023-03-09


2025-11-14 17:55:11,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:11,966 - INFO - Going to convert document batch...
2025-11-14 17:55:11,967 - INFO - Processing document 4_2023-03-31
2025-11-14 17:55:11,996 - INFO - Finished converting document 4_2023-03-31 in 0.06 sec.
2025-11-14 17:55:12,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:12,058 - INFO - Going to convert document batch...
2025-11-14 17:55:12,059 - INFO - Processing document 4_2023-04-04
2025-11-14 17:55:12,082 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.


Converted 'data\edgar_documents\WFC\4_2023-03-17' --> 'data\processed_data\WFC\4_2023-03-17.md'
Converted 'data\edgar_documents\WFC\4_2023-03-31' --> 'data\processed_data\WFC\4_2023-03-31.md'
Converted 'data\edgar_documents\WFC\4_2023-04-04' --> 'data\processed_data\WFC\4_2023-04-04.md'


2025-11-14 17:55:12,133 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,134 - ERROR - Input document 4_2023-04-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:12,135 - INFO - Going to convert document batch...
2025-11-14 17:55:12,153 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,154 - ERROR - Input document 4_2023-04-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\WFC\4_2023-04-17: File format not allowed: data\edgar_documents\WFC\4_2023-04-17
Error processing data\edgar_documents\WFC\4_2023-04-18: File format not allowed: data\edgar_documents\WFC\4_2023-04-18
Converted 'data\edgar_documents\WFC\4_2023-04-25' --> 'data\processed_data\WFC\4_2023-04-25.md'


2025-11-14 17:55:12,342 - INFO - Finished converting document 4_2023-04-27 in 0.08 sec.
2025-11-14 17:55:12,434 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,435 - ERROR - Input document 4_2023-05-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:12,437 - INFO - Going to convert document batch...
2025-11-14 17:55:12,457 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,458 - ERROR - Input document 4_2023-05-16 with forma

Converted 'data\edgar_documents\WFC\4_2023-04-27' --> 'data\processed_data\WFC\4_2023-04-27.md'
Error processing data\edgar_documents\WFC\4_2023-05-05: File format not allowed: data\edgar_documents\WFC\4_2023-05-05
Error processing data\edgar_documents\WFC\4_2023-05-16: File format not allowed: data\edgar_documents\WFC\4_2023-05-16
Error processing data\edgar_documents\WFC\4_2023-05-17: File format not allowed: data\edgar_documents\WFC\4_2023-05-17
Error processing data\edgar_documents\WFC\4_2023-05-26: File format not allowed: data\edgar_documents\WFC\4_2023-05-26
Error processing data\edgar_documents\WFC\4_2023-05-30: File format not allowed: data\edgar_documents\WFC\4_2023-05-30
Error processing data\edgar_documents\WFC\4_2023-05-31: File format not allowed: data\edgar_documents\WFC\4_2023-05-31


2025-11-14 17:55:12,613 - INFO - Finished converting document 4_2023-06-01 in 0.05 sec.
2025-11-14 17:55:12,660 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,661 - ERROR - Input document 4_2023-06-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:12,662 - INFO - Going to convert document batch...
2025-11-14 17:55:12,674 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,674 - ERROR - Input document 4_2023-06-07 with forma

Converted 'data\edgar_documents\WFC\4_2023-06-01' --> 'data\processed_data\WFC\4_2023-06-01.md'
Error processing data\edgar_documents\WFC\4_2023-06-06: File format not allowed: data\edgar_documents\WFC\4_2023-06-06
Error processing data\edgar_documents\WFC\4_2023-06-07: File format not allowed: data\edgar_documents\WFC\4_2023-06-07
Converted 'data\edgar_documents\WFC\4_2023-06-20' --> 'data\processed_data\WFC\4_2023-06-20.md'
Error processing data\edgar_documents\WFC\4_2023-06-21: File format not allowed: data\edgar_documents\WFC\4_2023-06-21
Converted 'data\edgar_documents\WFC\4_2023-07-05' --> 'data\processed_data\WFC\4_2023-07-05.md'


2025-11-14 17:55:12,861 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,862 - ERROR - Input document 4_2023-07-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:12,863 - INFO - Going to convert document batch...
2025-11-14 17:55:12,876 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:12,877 - ERROR - Input document 4_2023-07-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\WFC\4_2023-07-17: File format not allowed: data\edgar_documents\WFC\4_2023-07-17
Error processing data\edgar_documents\WFC\4_2023-07-18: File format not allowed: data\edgar_documents\WFC\4_2023-07-18
Error processing data\edgar_documents\WFC\4_2023-07-19: File format not allowed: data\edgar_documents\WFC\4_2023-07-19
Error processing data\edgar_documents\WFC\4_2023-07-25: File format not allowed: data\edgar_documents\WFC\4_2023-07-25
Error processing data\edgar_documents\WFC\4_2023-07-27: File format not allowed: data\edgar_documents\WFC\4_2023-07-27
Error processing data\edgar_documents\WFC\4_2023-08-04: File format not allowed: data\edgar_documents\WFC\4_2023-08-04
Error processing data\edgar_documents\WFC\4_2023-08-10: File format not allowed: data\edgar_documents\WFC\4_2023-08-10
Error processing data\edgar_documents\WFC\4_2023-08-22: File format not allowed: data\edgar_documents\WFC\4_2023-08-22
Error processing data\edgar_documents\WFC\4_2023

2025-11-14 17:55:13,044 - ERROR - Input document 4_2023-08-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:13,045 - INFO - Going to convert document batch...
2025-11-14 17:55:13,060 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,060 - ERROR - Input document 4_2023-09-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2023-08-30: File format not allowed: data\edgar_documents\WFC\4_2023-08-30
Error processing data\edgar_documents\WFC\4_2023-09-08: File format not allowed: data\edgar_documents\WFC\4_2023-09-08
Error processing data\edgar_documents\WFC\4_2023-09-11: File format not allowed: data\edgar_documents\WFC\4_2023-09-11
Converted 'data\edgar_documents\WFC\4_2023-09-13' --> 'data\processed_data\WFC\4_2023-09-13.md'
Converted 'data\edgar_documents\WFC\4_2023-09-19' --> 'data\processed_data\WFC\4_2023-09-19.md'


2025-11-14 17:55:13,257 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,258 - ERROR - Input document 4_2023-09-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:13,260 - INFO - Going to convert document batch...
2025-11-14 17:55:13,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:13,285 - INFO - Going to convert document batch...
2025-11-14 17:55:13,285 - INFO - Processing document 4_2023-10-03
2025-11-14 17:55:13,306 - INFO - Fin

Error processing data\edgar_documents\WFC\4_2023-09-20: File format not allowed: data\edgar_documents\WFC\4_2023-09-20
Converted 'data\edgar_documents\WFC\4_2023-10-03' --> 'data\processed_data\WFC\4_2023-10-03.md'
Converted 'data\edgar_documents\WFC\4_2023-10-11' --> 'data\processed_data\WFC\4_2023-10-11.md'
Error processing data\edgar_documents\WFC\4_2023-10-16: File format not allowed: data\edgar_documents\WFC\4_2023-10-16
Error processing data\edgar_documents\WFC\4_2023-10-17: File format not allowed: data\edgar_documents\WFC\4_2023-10-17


2025-11-14 17:55:13,459 - INFO - Going to convert document batch...
2025-11-14 17:55:13,460 - INFO - Processing document 4_2023-10-24
2025-11-14 17:55:13,484 - INFO - Finished converting document 4_2023-10-24 in 0.05 sec.
2025-11-14 17:55:13,524 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,525 - ERROR - Input document 4_2023-10-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:13,526 - INFO - Going to convert document batch...
2025-11-14 17:55:13,541 - IN

Converted 'data\edgar_documents\WFC\4_2023-10-24' --> 'data\processed_data\WFC\4_2023-10-24.md'
Error processing data\edgar_documents\WFC\4_2023-10-25: File format not allowed: data\edgar_documents\WFC\4_2023-10-25
Converted 'data\edgar_documents\WFC\4_2023-10-26' --> 'data\processed_data\WFC\4_2023-10-26.md'
Error processing data\edgar_documents\WFC\4_2023-11-03: File format not allowed: data\edgar_documents\WFC\4_2023-11-03
Error processing data\edgar_documents\WFC\4_2023-11-06: File format not allowed: data\edgar_documents\WFC\4_2023-11-06


2025-11-14 17:55:13,699 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,700 - ERROR - Input document 4_2023-11-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:13,701 - INFO - Going to convert document batch...
2025-11-14 17:55:13,715 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,716 - ERROR - Input document 4_2023-11-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\WFC\4_2023-11-09' --> 'data\processed_data\WFC\4_2023-11-09.md'
Error processing data\edgar_documents\WFC\4_2023-11-14: File format not allowed: data\edgar_documents\WFC\4_2023-11-14
Error processing data\edgar_documents\WFC\4_2023-11-22: File format not allowed: data\edgar_documents\WFC\4_2023-11-22
Error processing data\edgar_documents\WFC\4_2023-11-30: File format not allowed: data\edgar_documents\WFC\4_2023-11-30
Error processing data\edgar_documents\WFC\4_2023-12-01: File format not allowed: data\edgar_documents\WFC\4_2023-12-01
Error processing data\edgar_documents\WFC\4_2023-12-04: File format not allowed: data\edgar_documents\WFC\4_2023-12-04
Error processing data\edgar_documents\WFC\4_2023-12-12: File format not allowed: data\edgar_documents\WFC\4_2023-12-12
Error processing data\edgar_documents\WFC\4_2023-12-14: File format not allowed: data\edgar_documents\WFC\4_2023-12-14
Error processing data\edgar_documents\WFC\4_2023-12-21: File format not

2025-11-14 17:55:13,902 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:13,903 - ERROR - Input document 4_2024-01-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:13,906 - INFO - Going to convert document batch...
2025-11-14 17:55:13,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:13,932 - INFO - Going to convert document batch...
2025-11-14 17:55:13,934 - INFO - Processing document 4_2024-01-17
2025-11-14 17:55:13,959 - INFO - Fin

Error processing data\edgar_documents\WFC\4_2024-01-16: File format not allowed: data\edgar_documents\WFC\4_2024-01-16
Converted 'data\edgar_documents\WFC\4_2024-01-17' --> 'data\processed_data\WFC\4_2024-01-17.md'
Converted 'data\edgar_documents\WFC\4_2024-01-25' --> 'data\processed_data\WFC\4_2024-01-25.md'


2025-11-14 17:55:14,103 - ERROR - Input document 4_2024-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:14,104 - INFO - Going to convert document batch...
2025-11-14 17:55:14,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:14,126 - INFO - Going to convert document batch...
2025-11-14 17:55:14,127 - INFO - Processing document 4_2024-01-30
2025-11-14 17:55:14,152 - INFO - Finished converting document 4_2024-01-30 in 0.05 sec.
2025-11-14 17:55:14,188 - INFO - detec

Error processing data\edgar_documents\WFC\4_2024-01-29: File format not allowed: data\edgar_documents\WFC\4_2024-01-29
Converted 'data\edgar_documents\WFC\4_2024-01-30' --> 'data\processed_data\WFC\4_2024-01-30.md'
Error processing data\edgar_documents\WFC\4_2024-02-02: File format not allowed: data\edgar_documents\WFC\4_2024-02-02
Converted 'data\edgar_documents\WFC\4_2024-02-07' --> 'data\processed_data\WFC\4_2024-02-07.md'
Error processing data\edgar_documents\WFC\4_2024-02-14: File format not allowed: data\edgar_documents\WFC\4_2024-02-14


2025-11-14 17:55:14,306 - INFO - Going to convert document batch...
2025-11-14 17:55:14,307 - INFO - Processing document 4_2024-02-15
2025-11-14 17:55:14,337 - INFO - Finished converting document 4_2024-02-15 in 0.05 sec.
2025-11-14 17:55:14,396 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:14,397 - ERROR - Input document 4_2024-02-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:14,399 - INFO - Going to convert document batch...
2025-11-14 17:55:14,417 - IN

Converted 'data\edgar_documents\WFC\4_2024-02-15' --> 'data\processed_data\WFC\4_2024-02-15.md'
Error processing data\edgar_documents\WFC\4_2024-02-22: File format not allowed: data\edgar_documents\WFC\4_2024-02-22
Converted 'data\edgar_documents\WFC\4_2024-02-23' --> 'data\processed_data\WFC\4_2024-02-23.md'
Error processing data\edgar_documents\WFC\4_2024-02-28: File format not allowed: data\edgar_documents\WFC\4_2024-02-28


2025-11-14 17:55:14,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:14,615 - INFO - Going to convert document batch...
2025-11-14 17:55:14,616 - INFO - Processing document 4_2024-03-01
2025-11-14 17:55:14,653 - INFO - Finished converting document 4_2024-03-01 in 0.06 sec.
2025-11-14 17:55:14,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:14,715 - INFO - Going to convert document batch...
2025-11-14 17:55:14,716 - INFO - Processing document 4_2024-03-05
2025-11-14 17:55:14,745 - INFO - Finished converting document 4_2024-03-05 in 0.06 sec.


Converted 'data\edgar_documents\WFC\4_2024-02-29' --> 'data\processed_data\WFC\4_2024-02-29.md'
Converted 'data\edgar_documents\WFC\4_2024-03-01' --> 'data\processed_data\WFC\4_2024-03-01.md'
Converted 'data\edgar_documents\WFC\4_2024-03-05' --> 'data\processed_data\WFC\4_2024-03-05.md'


2025-11-14 17:55:14,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:14,808 - INFO - Going to convert document batch...
2025-11-14 17:55:14,809 - INFO - Processing document 4_2024-03-07
2025-11-14 17:55:14,830 - INFO - Finished converting document 4_2024-03-07 in 0.06 sec.
2025-11-14 17:55:14,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:14,879 - INFO - Going to convert document batch...
2025-11-14 17:55:14,879 - INFO - Processing document 4_2024-03-12
2025-11-14 17:55:14,901 - INFO - Finished converting document 4_2024-03-12 in 0.06 sec.
2025-11-14 17:55:14,937 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:14,938 - ERROR - Input document 4_2024-03-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\WFC\4_2024-03-07' --> 'data\processed_data\WFC\4_2024-03-07.md'
Converted 'data\edgar_documents\WFC\4_2024-03-12' --> 'data\processed_data\WFC\4_2024-03-12.md'
Error processing data\edgar_documents\WFC\4_2024-03-13: File format not allowed: data\edgar_documents\WFC\4_2024-03-13
Converted 'data\edgar_documents\WFC\4_2024-03-19' --> 'data\processed_data\WFC\4_2024-03-19.md'
Error processing data\edgar_documents\WFC\4_2024-03-21: File format not allowed: data\edgar_documents\WFC\4_2024-03-21


2025-11-14 17:55:15,031 - ERROR - Input document 4_2024-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:15,033 - INFO - Going to convert document batch...
2025-11-14 17:55:15,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:15,056 - INFO - Going to convert document batch...
2025-11-14 17:55:15,056 - INFO - Processing document 4_2024-03-28
2025-11-14 17:55:15,088 - INFO - Finished converting document 4_2024-03-28 in 0.06 sec.
2025-11-14 17:55:15,130 - INFO - detec

Error processing data\edgar_documents\WFC\4_2024-03-22: File format not allowed: data\edgar_documents\WFC\4_2024-03-22
Converted 'data\edgar_documents\WFC\4_2024-03-28' --> 'data\processed_data\WFC\4_2024-03-28.md'
Converted 'data\edgar_documents\WFC\4_2024-04-03' --> 'data\processed_data\WFC\4_2024-04-03.md'
Error processing data\edgar_documents\WFC\4_2024-04-15: File format not allowed: data\edgar_documents\WFC\4_2024-04-15


2025-11-14 17:55:15,221 - ERROR - Input document 4_2024-04-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:15,223 - INFO - Going to convert document batch...
2025-11-14 17:55:15,252 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:15,253 - ERROR - Input document 4_2024-04-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2024-04-16: File format not allowed: data\edgar_documents\WFC\4_2024-04-16
Error processing data\edgar_documents\WFC\4_2024-04-17: File format not allowed: data\edgar_documents\WFC\4_2024-04-17
Error processing data\edgar_documents\WFC\4_2024-04-23: File format not allowed: data\edgar_documents\WFC\4_2024-04-23
Error processing data\edgar_documents\WFC\4_2024-04-25: File format not allowed: data\edgar_documents\WFC\4_2024-04-25
Error processing data\edgar_documents\WFC\4_2024-04-26: File format not allowed: data\edgar_documents\WFC\4_2024-04-26
Converted 'data\edgar_documents\WFC\4_2024-05-01' --> 'data\processed_data\WFC\4_2024-05-01.md'


2025-11-14 17:55:15,400 - INFO - Processing document 4_2024-05-02
2025-11-14 17:55:15,419 - INFO - Finished converting document 4_2024-05-02 in 0.05 sec.
2025-11-14 17:55:15,454 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:15,454 - ERROR - Input document 4_2024-05-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:15,456 - INFO - Going to convert document batch...
2025-11-14 17:55:15,476 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\WFC\4_2024-05-02' --> 'data\processed_data\WFC\4_2024-05-02.md'
Error processing data\edgar_documents\WFC\4_2024-05-03: File format not allowed: data\edgar_documents\WFC\4_2024-05-03
Error processing data\edgar_documents\WFC\4_2024-05-06: File format not allowed: data\edgar_documents\WFC\4_2024-05-06
Converted 'data\edgar_documents\WFC\4_2024-05-07' --> 'data\processed_data\WFC\4_2024-05-07.md'


2025-11-14 17:55:15,645 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:15,645 - ERROR - Input document 4_2024-05-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:15,646 - INFO - Going to convert document batch...
2025-11-14 17:55:15,659 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:15,660 - ERROR - Input document 4_2024-05-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\WFC\4_2024-05-10' --> 'data\processed_data\WFC\4_2024-05-10.md'
Error processing data\edgar_documents\WFC\4_2024-05-15: File format not allowed: data\edgar_documents\WFC\4_2024-05-15
Error processing data\edgar_documents\WFC\4_2024-05-17: File format not allowed: data\edgar_documents\WFC\4_2024-05-17
Error processing data\edgar_documents\WFC\4_2024-05-20: File format not allowed: data\edgar_documents\WFC\4_2024-05-20
Error processing data\edgar_documents\WFC\4_2024-05-24: File format not allowed: data\edgar_documents\WFC\4_2024-05-24
Error processing data\edgar_documents\WFC\4_2024-05-28: File format not allowed: data\edgar_documents\WFC\4_2024-05-28
Error processing data\edgar_documents\WFC\4_2024-05-30: File format not allowed: data\edgar_documents\WFC\4_2024-05-30


2025-11-14 17:55:15,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:15,854 - INFO - Going to convert document batch...
2025-11-14 17:55:15,855 - INFO - Processing document 4_2024-06-10
2025-11-14 17:55:15,875 - INFO - Finished converting document 4_2024-06-10 in 0.05 sec.
2025-11-14 17:55:15,908 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:15,909 - ERROR - Input document 4_2024-06-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55

Converted 'data\edgar_documents\WFC\4_2024-06-07' --> 'data\processed_data\WFC\4_2024-06-07.md'
Converted 'data\edgar_documents\WFC\4_2024-06-10' --> 'data\processed_data\WFC\4_2024-06-10.md'
Error processing data\edgar_documents\WFC\4_2024-06-12: File format not allowed: data\edgar_documents\WFC\4_2024-06-12
Converted 'data\edgar_documents\WFC\4_2024-06-14' --> 'data\processed_data\WFC\4_2024-06-14.md'


2025-11-14 17:55:16,013 - INFO - Processing document 4_2024-06-18
2025-11-14 17:55:16,033 - INFO - Finished converting document 4_2024-06-18 in 0.05 sec.
2025-11-14 17:55:16,068 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,069 - ERROR - Input document 4_2024-06-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:16,070 - INFO - Going to convert document batch...
2025-11-14 17:55:16,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55

Converted 'data\edgar_documents\WFC\4_2024-06-18' --> 'data\processed_data\WFC\4_2024-06-18.md'
Error processing data\edgar_documents\WFC\4_2024-06-20: File format not allowed: data\edgar_documents\WFC\4_2024-06-20
Converted 'data\edgar_documents\WFC\4_2024-06-27' --> 'data\processed_data\WFC\4_2024-06-27.md'
Converted 'data\edgar_documents\WFC\4_2024-07-02' --> 'data\processed_data\WFC\4_2024-07-02.md'


2025-11-14 17:55:16,248 - INFO - Finished converting document 4_2024-07-03 in 0.05 sec.
2025-11-14 17:55:16,283 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,284 - ERROR - Input document 4_2024-07-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:16,285 - INFO - Going to convert document batch...
2025-11-14 17:55:16,320 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,320 - ERROR - Input document 4_2024-07-16 with forma

Converted 'data\edgar_documents\WFC\4_2024-07-03' --> 'data\processed_data\WFC\4_2024-07-03.md'
Error processing data\edgar_documents\WFC\4_2024-07-15: File format not allowed: data\edgar_documents\WFC\4_2024-07-15
Error processing data\edgar_documents\WFC\4_2024-07-16: File format not allowed: data\edgar_documents\WFC\4_2024-07-16
Error processing data\edgar_documents\WFC\4_2024-07-17: File format not allowed: data\edgar_documents\WFC\4_2024-07-17
Error processing data\edgar_documents\WFC\4_2024-07-19: File format not allowed: data\edgar_documents\WFC\4_2024-07-19
Error processing data\edgar_documents\WFC\4_2024-07-23: File format not allowed: data\edgar_documents\WFC\4_2024-07-23
Error processing data\edgar_documents\WFC\4_2024-07-25: File format not allowed: data\edgar_documents\WFC\4_2024-07-25
Error processing data\edgar_documents\WFC\4_2024-07-31: File format not allowed: data\edgar_documents\WFC\4_2024-07-31
Error processing data\edgar_documents\WFC\4_2024-08-06: File format not

2025-11-14 17:55:16,457 - ERROR - Input document 4_2024-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:16,458 - INFO - Going to convert document batch...
2025-11-14 17:55:16,471 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,472 - ERROR - Input document 4_2024-08-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2024-08-08: File format not allowed: data\edgar_documents\WFC\4_2024-08-08
Error processing data\edgar_documents\WFC\4_2024-08-12: File format not allowed: data\edgar_documents\WFC\4_2024-08-12
Error processing data\edgar_documents\WFC\4_2024-08-13: File format not allowed: data\edgar_documents\WFC\4_2024-08-13
Error processing data\edgar_documents\WFC\4_2024-08-15: File format not allowed: data\edgar_documents\WFC\4_2024-08-15
Error processing data\edgar_documents\WFC\4_2024-08-21: File format not allowed: data\edgar_documents\WFC\4_2024-08-21
Error processing data\edgar_documents\WFC\4_2024-08-22: File format not allowed: data\edgar_documents\WFC\4_2024-08-22
Converted 'data\edgar_documents\WFC\4_2024-08-23' --> 'data\processed_data\WFC\4_2024-08-23.md'
Error processing data\edgar_documents\WFC\4_2024-08-27: File format not allowed: data\edgar_documents\WFC\4_2024-08-27
Error processing data\edgar_documents\WFC\4_2024-08-28: File format not

2025-11-14 17:55:16,644 - ERROR - Input document 4_2024-08-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:16,645 - INFO - Going to convert document batch...
2025-11-14 17:55:16,657 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,658 - ERROR - Input document 4_2024-09-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2024-08-29: File format not allowed: data\edgar_documents\WFC\4_2024-08-29
Error processing data\edgar_documents\WFC\4_2024-09-03: File format not allowed: data\edgar_documents\WFC\4_2024-09-03
Error processing data\edgar_documents\WFC\4_2024-09-06: File format not allowed: data\edgar_documents\WFC\4_2024-09-06
Error processing data\edgar_documents\WFC\4_2024-09-10: File format not allowed: data\edgar_documents\WFC\4_2024-09-10
Error processing data\edgar_documents\WFC\4_2024-09-11: File format not allowed: data\edgar_documents\WFC\4_2024-09-11
Error processing data\edgar_documents\WFC\4_2024-09-12: File format not allowed: data\edgar_documents\WFC\4_2024-09-12
Error processing data\edgar_documents\WFC\4_2024-09-16: File format not allowed: data\edgar_documents\WFC\4_2024-09-16
Error processing data\edgar_documents\WFC\4_2024-09-19: File format not allowed: data\edgar_documents\WFC\4_2024-09-19
Error processing data\edgar_documents\WFC\4_2024

2025-11-14 17:55:16,839 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 17:55:16,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:16,886 - INFO - Going to convert document batch...
2025-11-14 17:55:16,887 - INFO - Processing document 4_2024-10-03
2025-11-14 17:55:16,912 - INFO - Finished converting document 4_2024-10-03 in 0.05 sec.
2025-11-14 17:55:16,950 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:16,951 - ERROR - Input document 4_2024-10-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\WFC\4_2024-10-01' --> 'data\processed_data\WFC\4_2024-10-01.md'
Converted 'data\edgar_documents\WFC\4_2024-10-03' --> 'data\processed_data\WFC\4_2024-10-03.md'
Error processing data\edgar_documents\WFC\4_2024-10-15: File format not allowed: data\edgar_documents\WFC\4_2024-10-15
Converted 'data\edgar_documents\WFC\4_2024-10-16' --> 'data\processed_data\WFC\4_2024-10-16.md'


2025-11-14 17:55:17,053 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,054 - ERROR - Input document 4_2024-10-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:17,055 - INFO - Going to convert document batch...
2025-11-14 17:55:17,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:17,077 - INFO - Going to convert document batch...
2025-11-14 17:55:17,078 - INFO - Processing document 4_2024-10-23
2025-11-14 17:55:17,102 - INFO - Fin

Error processing data\edgar_documents\WFC\4_2024-10-17: File format not allowed: data\edgar_documents\WFC\4_2024-10-17
Error processing data\edgar_documents\WFC\4_2024-10-22: File format not allowed: data\edgar_documents\WFC\4_2024-10-22
Converted 'data\edgar_documents\WFC\4_2024-10-23' --> 'data\processed_data\WFC\4_2024-10-23.md'
Converted 'data\edgar_documents\WFC\4_2024-10-24' --> 'data\processed_data\WFC\4_2024-10-24.md'
Error processing data\edgar_documents\WFC\4_2024-10-25: File format not allowed: data\edgar_documents\WFC\4_2024-10-25
Error processing data\edgar_documents\WFC\4_2024-10-31: File format not allowed: data\edgar_documents\WFC\4_2024-10-31


2025-11-14 17:55:17,230 - INFO - Going to convert document batch...
2025-11-14 17:55:17,242 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,242 - ERROR - Input document 4_2024-11-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:17,243 - INFO - Going to convert document batch...
2025-11-14 17:55:17,258 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,259 - ERROR - Input document 4_2024-11-08 with format None does not matc

Error processing data\edgar_documents\WFC\4_2024-11-01: File format not allowed: data\edgar_documents\WFC\4_2024-11-01
Error processing data\edgar_documents\WFC\4_2024-11-06: File format not allowed: data\edgar_documents\WFC\4_2024-11-06
Error processing data\edgar_documents\WFC\4_2024-11-08: File format not allowed: data\edgar_documents\WFC\4_2024-11-08
Error processing data\edgar_documents\WFC\4_2024-11-13: File format not allowed: data\edgar_documents\WFC\4_2024-11-13
Error processing data\edgar_documents\WFC\4_2024-11-15: File format not allowed: data\edgar_documents\WFC\4_2024-11-15
Error processing data\edgar_documents\WFC\4_2024-11-18: File format not allowed: data\edgar_documents\WFC\4_2024-11-18
Error processing data\edgar_documents\WFC\4_2024-11-19: File format not allowed: data\edgar_documents\WFC\4_2024-11-19
Error processing data\edgar_documents\WFC\4_2024-11-20: File format not allowed: data\edgar_documents\WFC\4_2024-11-20
Error processing data\edgar_documents\WFC\4_2024

2025-11-14 17:55:17,434 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,434 - ERROR - Input document 4_2024-11-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:17,435 - INFO - Going to convert document batch...
2025-11-14 17:55:17,449 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,450 - ERROR - Input document 4_2024-11-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\WFC\4_2024-11-25: File format not allowed: data\edgar_documents\WFC\4_2024-11-25
Error processing data\edgar_documents\WFC\4_2024-11-29: File format not allowed: data\edgar_documents\WFC\4_2024-11-29
Error processing data\edgar_documents\WFC\4_2024-12-03: File format not allowed: data\edgar_documents\WFC\4_2024-12-03
Error processing data\edgar_documents\WFC\4_2024-12-06: File format not allowed: data\edgar_documents\WFC\4_2024-12-06
Error processing data\edgar_documents\WFC\4_2024-12-09: File format not allowed: data\edgar_documents\WFC\4_2024-12-09
Converted 'data\edgar_documents\WFC\4_2024-12-11' --> 'data\processed_data\WFC\4_2024-12-11.md'


2025-11-14 17:55:17,633 - INFO - Finished converting document 4_2024-12-12 in 0.05 sec.
2025-11-14 17:55:17,701 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,702 - ERROR - Input document 4_2024-12-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:17,703 - INFO - Going to convert document batch...
2025-11-14 17:55:17,727 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:17,728 - ERROR - Input document 4_2024-12-19 with forma

Converted 'data\edgar_documents\WFC\4_2024-12-12' --> 'data\processed_data\WFC\4_2024-12-12.md'
Error processing data\edgar_documents\WFC\4_2024-12-13: File format not allowed: data\edgar_documents\WFC\4_2024-12-13
Error processing data\edgar_documents\WFC\4_2024-12-19: File format not allowed: data\edgar_documents\WFC\4_2024-12-19
Error processing data\edgar_documents\WFC\4_2024-12-20: File format not allowed: data\edgar_documents\WFC\4_2024-12-20
Converted 'data\edgar_documents\WFC\4_2025-01-03' --> 'data\processed_data\WFC\4_2025-01-03.md'
Error processing data\edgar_documents\WFC\4_2025-01-16: File format not allowed: data\edgar_documents\WFC\4_2025-01-16


2025-11-14 17:55:17,861 - ERROR - Input document 4_2025-01-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:17,862 - INFO - Going to convert document batch...
2025-11-14 17:55:17,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:17,887 - INFO - Going to convert document batch...
2025-11-14 17:55:17,888 - INFO - Processing document 4_2025-01-30
2025-11-14 17:55:17,910 - INFO - Finished converting document 4_2025-01-30 in 0.05 sec.
2025-11-14 17:55:17,947 - INFO - detec

Error processing data\edgar_documents\WFC\4_2025-01-17: File format not allowed: data\edgar_documents\WFC\4_2025-01-17
Converted 'data\edgar_documents\WFC\4_2025-01-30' --> 'data\processed_data\WFC\4_2025-01-30.md'
Error processing data\edgar_documents\WFC\4_2025-01-31: File format not allowed: data\edgar_documents\WFC\4_2025-01-31
Error processing data\edgar_documents\WFC\4_2025-02-03: File format not allowed: data\edgar_documents\WFC\4_2025-02-03
Error processing data\edgar_documents\WFC\4_2025-02-04: File format not allowed: data\edgar_documents\WFC\4_2025-02-04


2025-11-14 17:55:18,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:18,095 - INFO - Going to convert document batch...
2025-11-14 17:55:18,096 - INFO - Processing document 4_2025-02-11
2025-11-14 17:55:18,119 - INFO - Finished converting document 4_2025-02-11 in 0.05 sec.
2025-11-14 17:55:18,160 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,161 - ERROR - Input document 4_2025-02-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55

Converted 'data\edgar_documents\WFC\4_2025-02-07' --> 'data\processed_data\WFC\4_2025-02-07.md'
Converted 'data\edgar_documents\WFC\4_2025-02-11' --> 'data\processed_data\WFC\4_2025-02-11.md'
Error processing data\edgar_documents\WFC\4_2025-02-12: File format not allowed: data\edgar_documents\WFC\4_2025-02-12
Error processing data\edgar_documents\WFC\4_2025-02-13: File format not allowed: data\edgar_documents\WFC\4_2025-02-13
Error processing data\edgar_documents\WFC\4_2025-02-20: File format not allowed: data\edgar_documents\WFC\4_2025-02-20


2025-11-14 17:55:18,291 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,292 - ERROR - Input document 4_2025-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:18,293 - INFO - Going to convert document batch...
2025-11-14 17:55:18,307 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,308 - ERROR - Input document 4_2025-03-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\WFC\4_2025-02-26' --> 'data\processed_data\WFC\4_2025-02-26.md'
Error processing data\edgar_documents\WFC\4_2025-02-27: File format not allowed: data\edgar_documents\WFC\4_2025-02-27
Error processing data\edgar_documents\WFC\4_2025-03-04: File format not allowed: data\edgar_documents\WFC\4_2025-03-04
Converted 'data\edgar_documents\WFC\4_2025-03-07' --> 'data\processed_data\WFC\4_2025-03-07.md'
Converted 'data\edgar_documents\WFC\4_2025-03-11' --> 'data\processed_data\WFC\4_2025-03-11.md'


2025-11-14 17:55:18,466 - ERROR - Input document 4_2025-03-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:18,467 - INFO - Going to convert document batch...
2025-11-14 17:55:18,481 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,481 - ERROR - Input document 4_2025-03-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2025-03-12: File format not allowed: data\edgar_documents\WFC\4_2025-03-12
Error processing data\edgar_documents\WFC\4_2025-03-14: File format not allowed: data\edgar_documents\WFC\4_2025-03-14
Error processing data\edgar_documents\WFC\4_2025-03-21: File format not allowed: data\edgar_documents\WFC\4_2025-03-21
Error processing data\edgar_documents\WFC\4_2025-03-24: File format not allowed: data\edgar_documents\WFC\4_2025-03-24
Converted 'data\edgar_documents\WFC\4_2025-04-03' --> 'data\processed_data\WFC\4_2025-04-03.md'
Error processing data\edgar_documents\WFC\4_2025-04-14: File format not allowed: data\edgar_documents\WFC\4_2025-04-14
Error processing data\edgar_documents\WFC\4_2025-04-15: File format not allowed: data\edgar_documents\WFC\4_2025-04-15


2025-11-14 17:55:18,654 - ERROR - Input document 4_2025-04-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:18,655 - INFO - Going to convert document batch...
2025-11-14 17:55:18,668 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,668 - ERROR - Input document 4_2025-04-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2025-04-16: File format not allowed: data\edgar_documents\WFC\4_2025-04-16
Error processing data\edgar_documents\WFC\4_2025-04-23: File format not allowed: data\edgar_documents\WFC\4_2025-04-23
Error processing data\edgar_documents\WFC\4_2025-04-25: File format not allowed: data\edgar_documents\WFC\4_2025-04-25
Error processing data\edgar_documents\WFC\4_2025-04-28: File format not allowed: data\edgar_documents\WFC\4_2025-04-28
Error processing data\edgar_documents\WFC\4_2025-04-29: File format not allowed: data\edgar_documents\WFC\4_2025-04-29
Converted 'data\edgar_documents\WFC\4_2025-05-01' --> 'data\processed_data\WFC\4_2025-05-01.md'
Error processing data\edgar_documents\WFC\4_2025-05-07: File format not allowed: data\edgar_documents\WFC\4_2025-05-07
Error processing data\edgar_documents\WFC\4_2025-05-08: File format not allowed: data\edgar_documents\WFC\4_2025-05-08
Error processing data\edgar_documents\WFC\4_2025-05-19: File format not

2025-11-14 17:55:18,844 - ERROR - Input document 4_2025-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:18,845 - INFO - Going to convert document batch...
2025-11-14 17:55:18,858 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:18,859 - ERROR - Input document 4_2025-05-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2025-05-21: File format not allowed: data\edgar_documents\WFC\4_2025-05-21
Error processing data\edgar_documents\WFC\4_2025-05-29: File format not allowed: data\edgar_documents\WFC\4_2025-05-29
Error processing data\edgar_documents\WFC\4_2025-06-04: File format not allowed: data\edgar_documents\WFC\4_2025-06-04
Error processing data\edgar_documents\WFC\4_2025-06-05: File format not allowed: data\edgar_documents\WFC\4_2025-06-05
Error processing data\edgar_documents\WFC\4_2025-06-13: File format not allowed: data\edgar_documents\WFC\4_2025-06-13
Error processing data\edgar_documents\WFC\4_2025-06-16: File format not allowed: data\edgar_documents\WFC\4_2025-06-16
Converted 'data\edgar_documents\WFC\4_2025-06-17' --> 'data\processed_data\WFC\4_2025-06-17.md'


2025-11-14 17:55:19,028 - INFO - Processing document 4_2025-06-18
2025-11-14 17:55:19,048 - INFO - Finished converting document 4_2025-06-18 in 0.05 sec.
2025-11-14 17:55:19,085 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,087 - ERROR - Input document 4_2025-06-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:19,090 - INFO - Going to convert document batch...
2025-11-14 17:55:19,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55

Converted 'data\edgar_documents\WFC\4_2025-06-18' --> 'data\processed_data\WFC\4_2025-06-18.md'
Error processing data\edgar_documents\WFC\4_2025-06-27: File format not allowed: data\edgar_documents\WFC\4_2025-06-27
Converted 'data\edgar_documents\WFC\4_2025-07-03' --> 'data\processed_data\WFC\4_2025-07-03.md'
Error processing data\edgar_documents\WFC\4_2025-07-08: File format not allowed: data\edgar_documents\WFC\4_2025-07-08
Error processing data\edgar_documents\WFC\4_2025-07-09: File format not allowed: data\edgar_documents\WFC\4_2025-07-09
Error processing data\edgar_documents\WFC\4_2025-07-17: File format not allowed: data\edgar_documents\WFC\4_2025-07-17


2025-11-14 17:55:19,246 - ERROR - Input document 4_2025-07-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:19,247 - INFO - Going to convert document batch...
2025-11-14 17:55:19,261 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,262 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2025-07-21: File format not allowed: data\edgar_documents\WFC\4_2025-07-21
Error processing data\edgar_documents\WFC\4_2025-07-22: File format not allowed: data\edgar_documents\WFC\4_2025-07-22
Converted 'data\edgar_documents\WFC\4_2025-07-30' --> 'data\processed_data\WFC\4_2025-07-30.md'


2025-11-14 17:55:19,477 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,478 - ERROR - Input document 4_2025-08-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:19,479 - INFO - Going to convert document batch...
2025-11-14 17:55:19,495 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,496 - ERROR - Input document 4_2025-08-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\WFC\4_2025-07-31' --> 'data\processed_data\WFC\4_2025-07-31.md'
Error processing data\edgar_documents\WFC\4_2025-08-01: File format not allowed: data\edgar_documents\WFC\4_2025-08-01
Error processing data\edgar_documents\WFC\4_2025-08-04: File format not allowed: data\edgar_documents\WFC\4_2025-08-04
Converted 'data\edgar_documents\WFC\4_2025-08-05' --> 'data\processed_data\WFC\4_2025-08-05.md'
Error processing data\edgar_documents\WFC\4_2025-08-14: File format not allowed: data\edgar_documents\WFC\4_2025-08-14
Error processing data\edgar_documents\WFC\4_2025-08-27: File format not allowed: data\edgar_documents\WFC\4_2025-08-27
Error processing data\edgar_documents\WFC\4_2025-08-28: File format not allowed: data\edgar_documents\WFC\4_2025-08-28
Error processing data\edgar_documents\WFC\4_2025-09-08: File format not allowed: data\edgar_documents\WFC\4_2025-09-08


2025-11-14 17:55:19,659 - ERROR - Input document 4_2025-09-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:19,660 - INFO - Going to convert document batch...
2025-11-14 17:55:19,673 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,673 - ERROR - Input document 4_2025-09-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\WFC\4_2025-09-10: File format not allowed: data\edgar_documents\WFC\4_2025-09-10
Error processing data\edgar_documents\WFC\4_2025-09-11: File format not allowed: data\edgar_documents\WFC\4_2025-09-11
Error processing data\edgar_documents\WFC\4_2025-09-12: File format not allowed: data\edgar_documents\WFC\4_2025-09-12
Error processing data\edgar_documents\WFC\4_2025-09-16: File format not allowed: data\edgar_documents\WFC\4_2025-09-16
Error processing data\edgar_documents\WFC\4_2025-09-17: File format not allowed: data\edgar_documents\WFC\4_2025-09-17
Error processing data\edgar_documents\WFC\4_2025-09-19: File format not allowed: data\edgar_documents\WFC\4_2025-09-19
Error processing data\edgar_documents\WFC\4_2025-09-23: File format not allowed: data\edgar_documents\WFC\4_2025-09-23
Error processing data\edgar_documents\WFC\4_2025-09-24: File format not allowed: data\edgar_documents\WFC\4_2025-09-24
Error processing data\edgar_documents\WFC\4_2025

2025-11-14 17:55:19,886 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,887 - ERROR - Input document 4_2025-10-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:19,888 - INFO - Going to convert document batch...
2025-11-14 17:55:19,902 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:19,903 - ERROR - Input document 4_2025-10-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\WFC\4_2025-10-03' --> 'data\processed_data\WFC\4_2025-10-03.md'
Error processing data\edgar_documents\WFC\4_2025-10-06: File format not allowed: data\edgar_documents\WFC\4_2025-10-06
Error processing data\edgar_documents\WFC\4_2025-10-16: File format not allowed: data\edgar_documents\WFC\4_2025-10-16
Error processing data\edgar_documents\WFC\4_2025-10-29: File format not allowed: data\edgar_documents\WFC\4_2025-10-29
Error processing data\edgar_documents\WFC\4_2025-10-30: File format not allowed: data\edgar_documents\WFC\4_2025-10-30
Error processing data\edgar_documents\WFC\4_2025-10-31: File format not allowed: data\edgar_documents\WFC\4_2025-10-31
Error processing data\edgar_documents\WFC\4_2025-11-03: File format not allowed: data\edgar_documents\WFC\4_2025-11-03
Converted 'data\edgar_documents\WFC\8-K_2023-01-13' --> 'data\processed_data\WFC\8-K_2023-01-13.md'


2025-11-14 17:55:20,073 - INFO - Processing document 8-K_2023-01-26
2025-11-14 17:55:20,097 - INFO - Finished converting document 8-K_2023-01-26 in 0.05 sec.
2025-11-14 17:55:20,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,141 - INFO - Going to convert document batch...
2025-11-14 17:55:20,141 - INFO - Processing document 8-K_2023-02-17
2025-11-14 17:55:20,163 - INFO - Finished converting document 8-K_2023-02-17 in 0.05 sec.
2025-11-14 17:55:20,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,208 - INFO - Going to convert document batch...
2025-11-14 17:55:20,209 - INFO - Processing document 8-K_2023-02-24
2025-11-14 17:55:20,228 - INFO - Finished converting document 8-K_2023-02-24 in 0.05 sec.
2025-11-14 17:55:20,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,289 - INFO - Going to convert document batch...
2025-11-14 17:55:20,290 - INFO - Processing document 8-K_2023-04-13


Converted 'data\edgar_documents\WFC\8-K_2023-01-26' --> 'data\processed_data\WFC\8-K_2023-01-26.md'
Converted 'data\edgar_documents\WFC\8-K_2023-02-17' --> 'data\processed_data\WFC\8-K_2023-02-17.md'
Converted 'data\edgar_documents\WFC\8-K_2023-02-24' --> 'data\processed_data\WFC\8-K_2023-02-24.md'


2025-11-14 17:55:20,314 - INFO - Finished converting document 8-K_2023-04-13 in 0.08 sec.
2025-11-14 17:55:20,339 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,354 - INFO - Going to convert document batch...
2025-11-14 17:55:20,355 - INFO - Processing document 8-K_2023-04-14
2025-11-14 17:55:20,379 - INFO - Finished converting document 8-K_2023-04-14 in 0.05 sec.
2025-11-14 17:55:20,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,428 - INFO - Going to convert document batch...
2025-11-14 17:55:20,429 - INFO - Processing document 8-K_2023-04-24
2025-11-14 17:55:20,455 - INFO - Finished converting document 8-K_2023-04-24 in 0.06 sec.
2025-11-14 17:55:20,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,497 - INFO - Going to convert document batch...
2025-11-14 17:55:20,498 - INFO - Processing document 8-K_2023-04-27


Converted 'data\edgar_documents\WFC\8-K_2023-04-13' --> 'data\processed_data\WFC\8-K_2023-04-13.md'
Converted 'data\edgar_documents\WFC\8-K_2023-04-14' --> 'data\processed_data\WFC\8-K_2023-04-14.md'
Converted 'data\edgar_documents\WFC\8-K_2023-04-24' --> 'data\processed_data\WFC\8-K_2023-04-24.md'


2025-11-14 17:55:20,520 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 17:55:20,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,565 - INFO - Going to convert document batch...
2025-11-14 17:55:20,566 - INFO - Processing document 8-K_2023-05-12
2025-11-14 17:55:20,593 - INFO - Finished converting document 8-K_2023-05-12 in 0.06 sec.
2025-11-14 17:55:20,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,639 - INFO - Going to convert document batch...
2025-11-14 17:55:20,640 - INFO - Processing document 8-K_2023-06-29
2025-11-14 17:55:20,662 - INFO - Finished converting document 8-K_2023-06-29 in 0.05 sec.
2025-11-14 17:55:20,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,702 - INFO - Going to convert document batch...
2025-11-14 17:55:20,703 - INFO - Processing document 8-K_2023-07-14


Converted 'data\edgar_documents\WFC\8-K_2023-04-27' --> 'data\processed_data\WFC\8-K_2023-04-27.md'
Converted 'data\edgar_documents\WFC\8-K_2023-05-12' --> 'data\processed_data\WFC\8-K_2023-05-12.md'
Converted 'data\edgar_documents\WFC\8-K_2023-06-29' --> 'data\processed_data\WFC\8-K_2023-06-29.md'


2025-11-14 17:55:20,726 - INFO - Finished converting document 8-K_2023-07-14 in 0.05 sec.
2025-11-14 17:55:20,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,776 - INFO - Going to convert document batch...
2025-11-14 17:55:20,777 - INFO - Processing document 8-K_2023-07-24
2025-11-14 17:55:20,812 - INFO - Finished converting document 8-K_2023-07-24 in 0.08 sec.
2025-11-14 17:55:20,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,885 - INFO - Going to convert document batch...
2025-11-14 17:55:20,887 - INFO - Processing document 8-K_2023-07-25
2025-11-14 17:55:20,930 - INFO - Finished converting document 8-K_2023-07-25 in 0.09 sec.


Converted 'data\edgar_documents\WFC\8-K_2023-07-14' --> 'data\processed_data\WFC\8-K_2023-07-14.md'
Converted 'data\edgar_documents\WFC\8-K_2023-07-24' --> 'data\processed_data\WFC\8-K_2023-07-24.md'


2025-11-14 17:55:20,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:20,992 - INFO - Going to convert document batch...
2025-11-14 17:55:20,993 - INFO - Processing document 8-K_2023-08-10
2025-11-14 17:55:21,018 - INFO - Finished converting document 8-K_2023-08-10 in 0.06 sec.
2025-11-14 17:55:21,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,061 - INFO - Going to convert document batch...
2025-11-14 17:55:21,062 - INFO - Processing document 8-K_2023-09-18
2025-11-14 17:55:21,088 - INFO - Finished converting document 8-K_2023-09-18 in 0.06 sec.
2025-11-14 17:55:21,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,133 - INFO - Going to convert document batch...
2025-11-14 17:55:21,134 - INFO - Processing document 8-K_2023-10-13


Converted 'data\edgar_documents\WFC\8-K_2023-07-25' --> 'data\processed_data\WFC\8-K_2023-07-25.md'
Converted 'data\edgar_documents\WFC\8-K_2023-08-10' --> 'data\processed_data\WFC\8-K_2023-08-10.md'
Converted 'data\edgar_documents\WFC\8-K_2023-09-18' --> 'data\processed_data\WFC\8-K_2023-09-18.md'


2025-11-14 17:55:21,159 - INFO - Finished converting document 8-K_2023-10-13 in 0.06 sec.
2025-11-14 17:55:21,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,203 - INFO - Going to convert document batch...
2025-11-14 17:55:21,204 - INFO - Processing document 8-K_2023-10-23
2025-11-14 17:55:21,231 - INFO - Finished converting document 8-K_2023-10-23 in 0.06 sec.
2025-11-14 17:55:21,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,277 - INFO - Going to convert document batch...
2025-11-14 17:55:21,278 - INFO - Processing document 8-K_2023-12-13
2025-11-14 17:55:21,317 - INFO - Finished converting document 8-K_2023-12-13 in 0.06 sec.
2025-11-14 17:55:21,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\8-K_2023-10-13' --> 'data\processed_data\WFC\8-K_2023-10-13.md'
Converted 'data\edgar_documents\WFC\8-K_2023-10-23' --> 'data\processed_data\WFC\8-K_2023-10-23.md'
Converted 'data\edgar_documents\WFC\8-K_2023-12-13' --> 'data\processed_data\WFC\8-K_2023-12-13.md'


2025-11-14 17:55:21,378 - INFO - Going to convert document batch...
2025-11-14 17:55:21,379 - INFO - Processing document 8-K_2024-01-12
2025-11-14 17:55:21,409 - INFO - Finished converting document 8-K_2024-01-12 in 0.08 sec.
2025-11-14 17:55:21,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,471 - INFO - Going to convert document batch...
2025-11-14 17:55:21,471 - INFO - Processing document 8-K_2024-01-23
2025-11-14 17:55:21,505 - INFO - Finished converting document 8-K_2024-01-23 in 0.06 sec.
2025-11-14 17:55:21,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,557 - INFO - Going to convert document batch...
2025-11-14 17:55:21,558 - INFO - Processing document 8-K_2024-01-24
2025-11-14 17:55:21,585 - INFO - Finished converting document 8-K_2024-01-24 in 0.06 sec.
2025-11-14 17:55:21,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,630 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WFC\8-K_2024-01-12' --> 'data\processed_data\WFC\8-K_2024-01-12.md'
Converted 'data\edgar_documents\WFC\8-K_2024-01-23' --> 'data\processed_data\WFC\8-K_2024-01-23.md'
Converted 'data\edgar_documents\WFC\8-K_2024-01-24' --> 'data\processed_data\WFC\8-K_2024-01-24.md'


2025-11-14 17:55:21,631 - INFO - Processing document 8-K_2024-01-25
2025-11-14 17:55:21,653 - INFO - Finished converting document 8-K_2024-01-25 in 0.06 sec.
2025-11-14 17:55:21,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,701 - INFO - Going to convert document batch...
2025-11-14 17:55:21,703 - INFO - Processing document 8-K_2024-02-06
2025-11-14 17:55:21,750 - INFO - Finished converting document 8-K_2024-02-06 in 0.09 sec.
2025-11-14 17:55:21,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,808 - INFO - Going to convert document batch...
2025-11-14 17:55:21,809 - INFO - Processing document 8-K_2024-03-18
2025-11-14 17:55:21,837 - INFO - Finished converting document 8-K_2024-03-18 in 0.06 sec.


Converted 'data\edgar_documents\WFC\8-K_2024-01-25' --> 'data\processed_data\WFC\8-K_2024-01-25.md'
Converted 'data\edgar_documents\WFC\8-K_2024-02-06' --> 'data\processed_data\WFC\8-K_2024-02-06.md'


2025-11-14 17:55:21,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,883 - INFO - Going to convert document batch...
2025-11-14 17:55:21,884 - INFO - Processing document 8-K_2024-04-12
2025-11-14 17:55:21,908 - INFO - Finished converting document 8-K_2024-04-12 in 0.06 sec.
2025-11-14 17:55:21,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:21,956 - INFO - Going to convert document batch...
2025-11-14 17:55:21,957 - INFO - Processing document 8-K_2024-04-22
2025-11-14 17:55:21,987 - INFO - Finished converting document 8-K_2024-04-22 in 0.06 sec.
2025-11-14 17:55:22,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:22,032 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WFC\8-K_2024-03-18' --> 'data\processed_data\WFC\8-K_2024-03-18.md'
Converted 'data\edgar_documents\WFC\8-K_2024-04-12' --> 'data\processed_data\WFC\8-K_2024-04-12.md'
Converted 'data\edgar_documents\WFC\8-K_2024-04-22' --> 'data\processed_data\WFC\8-K_2024-04-22.md'


2025-11-14 17:55:22,033 - INFO - Processing document 8-K_2024-04-23
2025-11-14 17:55:22,059 - INFO - Finished converting document 8-K_2024-04-23 in 0.06 sec.
2025-11-14 17:55:22,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:22,147 - INFO - Going to convert document batch...
2025-11-14 17:55:22,148 - INFO - Processing document 8-K_2024-05-02
2025-11-14 17:55:22,278 - INFO - Finished converting document 8-K_2024-05-02 in 0.20 sec.


Converted 'data\edgar_documents\WFC\8-K_2024-04-23' --> 'data\processed_data\WFC\8-K_2024-04-23.md'


2025-11-14 17:55:22,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:22,365 - INFO - Going to convert document batch...
2025-11-14 17:55:22,366 - INFO - Processing document 8-K_2024-05-09
2025-11-14 17:55:22,394 - INFO - Finished converting document 8-K_2024-05-09 in 0.06 sec.
2025-11-14 17:55:22,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:22,462 - INFO - Going to convert document batch...
2025-11-14 17:55:22,463 - INFO - Processing document 8-K_2024-06-18


Converted 'data\edgar_documents\WFC\8-K_2024-05-02' --> 'data\processed_data\WFC\8-K_2024-05-02.md'
Converted 'data\edgar_documents\WFC\8-K_2024-05-09' --> 'data\processed_data\WFC\8-K_2024-05-09.md'


2025-11-14 17:55:23,731 - INFO - Finished converting document 8-K_2024-06-18 in 1.33 sec.
2025-11-14 17:55:23,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:23,796 - INFO - Going to convert document batch...
2025-11-14 17:55:23,796 - INFO - Processing document 8-K_2024-07-12
2025-11-14 17:55:23,824 - INFO - Finished converting document 8-K_2024-07-12 in 0.08 sec.
2025-11-14 17:55:23,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:23,898 - INFO - Going to convert document batch...
2025-11-14 17:55:23,899 - INFO - Processing document 8-K_2024-07-23
2025-11-14 17:55:23,933 - INFO - Finished converting document 8-K_2024-07-23 in 0.09 sec.


Converted 'data\edgar_documents\WFC\8-K_2024-06-18' --> 'data\processed_data\WFC\8-K_2024-06-18.md'
Converted 'data\edgar_documents\WFC\8-K_2024-07-12' --> 'data\processed_data\WFC\8-K_2024-07-12.md'


2025-11-14 17:55:23,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:23,984 - INFO - Going to convert document batch...
2025-11-14 17:55:23,985 - INFO - Processing document 8-K_2024-09-12
2025-11-14 17:55:24,008 - INFO - Finished converting document 8-K_2024-09-12 in 0.05 sec.
2025-11-14 17:55:24,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,060 - INFO - Going to convert document batch...
2025-11-14 17:55:24,062 - INFO - Processing document 8-K_2024-10-11
2025-11-14 17:55:24,096 - INFO - Finished converting document 8-K_2024-10-11 in 0.08 sec.


Converted 'data\edgar_documents\WFC\8-K_2024-07-23' --> 'data\processed_data\WFC\8-K_2024-07-23.md'
Converted 'data\edgar_documents\WFC\8-K_2024-09-12' --> 'data\processed_data\WFC\8-K_2024-09-12.md'
Converted 'data\edgar_documents\WFC\8-K_2024-10-11' --> 'data\processed_data\WFC\8-K_2024-10-11.md'


2025-11-14 17:55:24,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,165 - INFO - Going to convert document batch...
2025-11-14 17:55:24,166 - INFO - Processing document 8-K_2024-12-03
2025-11-14 17:55:24,194 - INFO - Finished converting document 8-K_2024-12-03 in 0.08 sec.
2025-11-14 17:55:24,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,237 - INFO - Going to convert document batch...
2025-11-14 17:55:24,237 - INFO - Processing document 8-K_2025-01-15
2025-11-14 17:55:24,262 - INFO - Finished converting document 8-K_2025-01-15 in 0.06 sec.
2025-11-14 17:55:24,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,302 - INFO - Going to convert document batch...
2025-11-14 17:55:24,304 - INFO - Processing document 8-K_2025-01-24
2025-11-14 17:55:24,330 - INFO - Finished converting document 8-K_2025-01-24 in 0.06 sec.
2025-11-14 17:55:24,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\WFC\8-K_2024-12-03' --> 'data\processed_data\WFC\8-K_2024-12-03.md'
Converted 'data\edgar_documents\WFC\8-K_2025-01-15' --> 'data\processed_data\WFC\8-K_2025-01-15.md'
Converted 'data\edgar_documents\WFC\8-K_2025-01-24' --> 'data\processed_data\WFC\8-K_2025-01-24.md'


2025-11-14 17:55:24,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,425 - INFO - Going to convert document batch...
2025-11-14 17:55:24,426 - INFO - Processing document 8-K_2025-01-30
2025-11-14 17:55:24,445 - INFO - Finished converting document 8-K_2025-01-30 in 0.03 sec.
2025-11-14 17:55:24,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,485 - INFO - Going to convert document batch...
2025-11-14 17:55:24,486 - INFO - Processing document 8-K_2025-02-13
2025-11-14 17:55:24,508 - INFO - Finished converting document 8-K_2025-02-13 in 0.05 sec.
2025-11-14 17:55:24,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,568 - INFO - Going to convert document batch...
2025-11-14 17:55:24,568 - INFO - Processing document 8-K_2025-03-17
2025-11-14 17:55:24,589 - INFO - Finished converting document 8-K_2025-03-17 in 0.08 sec.


Converted 'data\edgar_documents\WFC\8-K_2025-01-28' --> 'data\processed_data\WFC\8-K_2025-01-28.md'
Converted 'data\edgar_documents\WFC\8-K_2025-01-30' --> 'data\processed_data\WFC\8-K_2025-01-30.md'
Converted 'data\edgar_documents\WFC\8-K_2025-02-13' --> 'data\processed_data\WFC\8-K_2025-02-13.md'


2025-11-14 17:55:24,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,624 - INFO - Going to convert document batch...
2025-11-14 17:55:24,625 - INFO - Processing document 8-K_2025-04-11
2025-11-14 17:55:24,661 - INFO - Finished converting document 8-K_2025-04-11 in 0.06 sec.
2025-11-14 17:55:24,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,727 - INFO - Going to convert document batch...
2025-11-14 17:55:24,728 - INFO - Processing document 8-K_2025-04-23
2025-11-14 17:55:24,757 - INFO - Finished converting document 8-K_2025-04-23 in 0.06 sec.
2025-11-14 17:55:24,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\8-K_2025-03-17' --> 'data\processed_data\WFC\8-K_2025-03-17.md'
Converted 'data\edgar_documents\WFC\8-K_2025-04-11' --> 'data\processed_data\WFC\8-K_2025-04-11.md'
Converted 'data\edgar_documents\WFC\8-K_2025-04-23' --> 'data\processed_data\WFC\8-K_2025-04-23.md'


2025-11-14 17:55:24,800 - INFO - Going to convert document batch...
2025-11-14 17:55:24,801 - INFO - Processing document 8-K_2025-04-30
2025-11-14 17:55:24,822 - INFO - Finished converting document 8-K_2025-04-30 in 0.05 sec.
2025-11-14 17:55:24,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,880 - INFO - Going to convert document batch...
2025-11-14 17:55:24,880 - INFO - Processing document 8-K_2025-05-02
2025-11-14 17:55:24,925 - INFO - Finished converting document 8-K_2025-05-02 in 0.09 sec.
2025-11-14 17:55:24,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:24,972 - INFO - Going to convert document batch...
2025-11-14 17:55:24,973 - INFO - Processing document 8-K_2025-05-14
2025-11-14 17:55:24,997 - INFO - Finished converting document 8-K_2025-05-14 in 0.05 sec.


Converted 'data\edgar_documents\WFC\8-K_2025-04-30' --> 'data\processed_data\WFC\8-K_2025-04-30.md'
Converted 'data\edgar_documents\WFC\8-K_2025-05-02' --> 'data\processed_data\WFC\8-K_2025-05-02.md'
Converted 'data\edgar_documents\WFC\8-K_2025-05-14' --> 'data\processed_data\WFC\8-K_2025-05-14.md'


2025-11-14 17:55:25,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,064 - INFO - Going to convert document batch...
2025-11-14 17:55:25,065 - INFO - Processing document 8-K_2025-05-30
2025-11-14 17:55:25,086 - INFO - Finished converting document 8-K_2025-05-30 in 0.06 sec.
2025-11-14 17:55:25,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,128 - INFO - Going to convert document batch...
2025-11-14 17:55:25,129 - INFO - Processing document 8-K_2025-06-03
2025-11-14 17:55:25,149 - INFO - Finished converting document 8-K_2025-06-03 in 0.05 sec.
2025-11-14 17:55:25,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,210 - INFO - Going to convert document batch...
2025-11-14 17:55:25,213 - INFO - Processing document 8-K_2025-06-17
2025-11-14 17:55:25,261 - INFO - Finished converting document 8-K_2025-06-17 in 0.11 sec.
2025-11-14 17:55:25,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\8-K_2025-05-30' --> 'data\processed_data\WFC\8-K_2025-05-30.md'
Converted 'data\edgar_documents\WFC\8-K_2025-06-03' --> 'data\processed_data\WFC\8-K_2025-06-03.md'
Converted 'data\edgar_documents\WFC\8-K_2025-06-17' --> 'data\processed_data\WFC\8-K_2025-06-17.md'


2025-11-14 17:55:25,303 - INFO - Going to convert document batch...
2025-11-14 17:55:25,304 - INFO - Processing document 8-K_2025-07-15
2025-11-14 17:55:25,325 - INFO - Finished converting document 8-K_2025-07-15 in 0.05 sec.
2025-11-14 17:55:25,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,366 - INFO - Going to convert document batch...
2025-11-14 17:55:25,367 - INFO - Processing document 8-K_2025-07-29
2025-11-14 17:55:25,394 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 17:55:25,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,435 - INFO - Going to convert document batch...
2025-11-14 17:55:25,435 - INFO - Processing document 8-K_2025-07-31
2025-11-14 17:55:25,463 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 17:55:25,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,507 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\WFC\8-K_2025-07-15' --> 'data\processed_data\WFC\8-K_2025-07-15.md'
Converted 'data\edgar_documents\WFC\8-K_2025-07-29' --> 'data\processed_data\WFC\8-K_2025-07-29.md'
Converted 'data\edgar_documents\WFC\8-K_2025-07-31' --> 'data\processed_data\WFC\8-K_2025-07-31.md'


2025-11-14 17:55:25,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,578 - INFO - Going to convert document batch...
2025-11-14 17:55:25,579 - INFO - Processing document 8-K_2025-09-15
2025-11-14 17:55:25,607 - INFO - Finished converting document 8-K_2025-09-15 in 0.06 sec.
2025-11-14 17:55:25,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:25,670 - INFO - Going to convert document batch...
2025-11-14 17:55:25,672 - INFO - Processing document 8-K_2025-10-14
2025-11-14 17:55:25,703 - INFO - Finished converting document 8-K_2025-10-14 in 0.08 sec.


Converted 'data\edgar_documents\WFC\8-K_2025-08-28' --> 'data\processed_data\WFC\8-K_2025-08-28.md'
Converted 'data\edgar_documents\WFC\8-K_2025-09-15' --> 'data\processed_data\WFC\8-K_2025-09-15.md'
Converted 'data\edgar_documents\WFC\8-K_2025-10-14' --> 'data\processed_data\WFC\8-K_2025-10-14.md'


2025-11-14 17:55:25,782 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:25,783 - ERROR - Input document DEF-14A_2023-03-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:25,786 - INFO - Going to convert document batch...
2025-11-14 17:55:25,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\WFC\DEF-14A_2023-03-15: File format not allowed: data\edgar_documents\WFC\DEF-14A_2023-03-15


2025-11-14 17:55:26,715 - INFO - Going to convert document batch...
2025-11-14 17:55:26,715 - INFO - Processing document DEF-14A_2024-03-18
2025-11-14 17:55:29,339 - INFO - Finished converting document DEF-14A_2024-03-18 in 3.56 sec.
2025-11-14 17:55:30,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\DEF-14A_2024-03-18' --> 'data\processed_data\WFC\DEF-14A_2024-03-18.md'


2025-11-14 17:55:31,255 - INFO - Going to convert document batch...
2025-11-14 17:55:31,256 - INFO - Processing document DEF-14A_2025-03-19
2025-11-14 17:55:33,409 - INFO - Finished converting document DEF-14A_2025-03-19 in 2.97 sec.
2025-11-14 17:55:34,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WFC\DEF-14A_2025-03-19' --> 'data\processed_data\WFC\DEF-14A_2025-03-19.md'
Processed 142 new files. Errors: 181
Found 254 files to process in data\edgar_documents\WMT


2025-11-14 17:55:35,449 - INFO - Going to convert document batch...
2025-11-14 17:55:35,450 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:55:35,450 - INFO - Processing document 10-K_2023-03-17
2025-11-14 17:55:36,662 - INFO - Finished converting document 10-K_2023-03-17 in 2.25 sec.
2025-11-14 17:55:37,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-K_2023-03-17' --> 'data\processed_data\WMT\10-K_2023-03-17.md'


2025-11-14 17:55:37,952 - INFO - Going to convert document batch...
2025-11-14 17:55:37,953 - INFO - Processing document 10-K_2024-03-15
2025-11-14 17:55:39,035 - INFO - Finished converting document 10-K_2024-03-15 in 1.83 sec.
2025-11-14 17:55:39,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-K_2024-03-15' --> 'data\processed_data\WMT\10-K_2024-03-15.md'


2025-11-14 17:55:40,106 - INFO - Going to convert document batch...
2025-11-14 17:55:40,107 - INFO - Processing document 10-K_2025-03-14
2025-11-14 17:55:41,168 - INFO - Finished converting document 10-K_2025-03-14 in 1.59 sec.
2025-11-14 17:55:41,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-K_2025-03-14' --> 'data\processed_data\WMT\10-K_2025-03-14.md'


2025-11-14 17:55:42,430 - INFO - Going to convert document batch...
2025-11-14 17:55:42,431 - INFO - Processing document 10-Q_2023-06-02
2025-11-14 17:55:42,967 - INFO - Finished converting document 10-Q_2023-06-02 in 1.28 sec.
2025-11-14 17:55:43,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2023-06-02' --> 'data\processed_data\WMT\10-Q_2023-06-02.md'


2025-11-14 17:55:43,592 - INFO - Going to convert document batch...
2025-11-14 17:55:43,593 - INFO - Processing document 10-Q_2023-09-01
2025-11-14 17:55:44,216 - INFO - Finished converting document 10-Q_2023-09-01 in 0.97 sec.
2025-11-14 17:55:44,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2023-09-01' --> 'data\processed_data\WMT\10-Q_2023-09-01.md'


2025-11-14 17:55:45,210 - INFO - Going to convert document batch...
2025-11-14 17:55:45,211 - INFO - Processing document 10-Q_2023-11-30
2025-11-14 17:55:45,840 - INFO - Finished converting document 10-Q_2023-11-30 in 1.31 sec.
2025-11-14 17:55:46,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2023-11-30' --> 'data\processed_data\WMT\10-Q_2023-11-30.md'


2025-11-14 17:55:46,427 - INFO - Going to convert document batch...
2025-11-14 17:55:46,427 - INFO - Processing document 10-Q_2024-06-07
2025-11-14 17:55:46,948 - INFO - Finished converting document 10-Q_2024-06-07 in 0.80 sec.
2025-11-14 17:55:47,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2024-06-07' --> 'data\processed_data\WMT\10-Q_2024-06-07.md'


2025-11-14 17:55:47,793 - INFO - Going to convert document batch...
2025-11-14 17:55:47,794 - INFO - Processing document 10-Q_2024-08-30
2025-11-14 17:55:48,415 - INFO - Finished converting document 10-Q_2024-08-30 in 1.19 sec.
2025-11-14 17:55:48,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2024-08-30' --> 'data\processed_data\WMT\10-Q_2024-08-30.md'


2025-11-14 17:55:49,057 - INFO - Going to convert document batch...
2025-11-14 17:55:49,058 - INFO - Processing document 10-Q_2024-12-06
2025-11-14 17:55:49,667 - INFO - Finished converting document 10-Q_2024-12-06 in 0.97 sec.
2025-11-14 17:55:50,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2024-12-06' --> 'data\processed_data\WMT\10-Q_2024-12-06.md'


2025-11-14 17:55:50,518 - INFO - Going to convert document batch...
2025-11-14 17:55:50,519 - INFO - Processing document 10-Q_2025-06-06
2025-11-14 17:55:51,118 - INFO - Finished converting document 10-Q_2025-06-06 in 0.89 sec.
2025-11-14 17:55:51,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\10-Q_2025-06-06' --> 'data\processed_data\WMT\10-Q_2025-06-06.md'


2025-11-14 17:55:51,802 - INFO - Going to convert document batch...
2025-11-14 17:55:51,803 - INFO - Processing document 10-Q_2025-08-29
2025-11-14 17:55:52,659 - INFO - Finished converting document 10-Q_2025-08-29 in 1.23 sec.
2025-11-14 17:55:53,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,036 - INFO - Going to convert document batch...
2025-11-14 17:55:53,037 - INFO - Processing document 4_2023-01-04
2025-11-14 17:55:53,054 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 17:55:53,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,094 - INFO - Going to convert document batch...
2025-11-14 17:55:53,095 - INFO - Processing document 4_2023-01-05
2025-11-14 17:55:53,114 - INFO - Finished converting document 4_2023-01-05 in 0.03 sec.
2025-11-14 17:55:53,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,154 - INFO - Going to convert document batch...
2025-11-14 17:55:53,

Converted 'data\edgar_documents\WMT\10-Q_2025-08-29' --> 'data\processed_data\WMT\10-Q_2025-08-29.md'
Converted 'data\edgar_documents\WMT\4_2023-01-04' --> 'data\processed_data\WMT\4_2023-01-04.md'
Converted 'data\edgar_documents\WMT\4_2023-01-05' --> 'data\processed_data\WMT\4_2023-01-05.md'


2025-11-14 17:55:53,206 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,217 - INFO - Going to convert document batch...
2025-11-14 17:55:53,218 - INFO - Processing document 4_2023-01-27
2025-11-14 17:55:53,240 - INFO - Finished converting document 4_2023-01-27 in 0.05 sec.
2025-11-14 17:55:53,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,313 - INFO - Going to convert document batch...
2025-11-14 17:55:53,314 - INFO - Processing document 4_2023-02-02
2025-11-14 17:55:53,342 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.
2025-11-14 17:55:53,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-01-19' --> 'data\processed_data\WMT\4_2023-01-19.md'
Converted 'data\edgar_documents\WMT\4_2023-01-27' --> 'data\processed_data\WMT\4_2023-01-27.md'
Converted 'data\edgar_documents\WMT\4_2023-02-02' --> 'data\processed_data\WMT\4_2023-02-02.md'


2025-11-14 17:55:53,395 - INFO - Going to convert document batch...
2025-11-14 17:55:53,396 - INFO - Processing document 4_2023-02-16
2025-11-14 17:55:53,423 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.
2025-11-14 17:55:53,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,477 - INFO - Going to convert document batch...
2025-11-14 17:55:53,477 - INFO - Processing document 4_2023-02-23
2025-11-14 17:55:53,510 - INFO - Finished converting document 4_2023-02-23 in 0.06 sec.
2025-11-14 17:55:53,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,561 - INFO - Going to convert document batch...
2025-11-14 17:55:53,562 - INFO - Processing document 4_2023-02-24
2025-11-14 17:55:53,611 - INFO - Finished converting document 4_2023-02-24 in 0.08 sec.


Converted 'data\edgar_documents\WMT\4_2023-02-16' --> 'data\processed_data\WMT\4_2023-02-16.md'
Converted 'data\edgar_documents\WMT\4_2023-02-23' --> 'data\processed_data\WMT\4_2023-02-23.md'


2025-11-14 17:55:53,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,678 - INFO - Going to convert document batch...
2025-11-14 17:55:53,678 - INFO - Processing document 4_2023-03-01
2025-11-14 17:55:53,708 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 17:55:53,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,756 - INFO - Going to convert document batch...
2025-11-14 17:55:53,757 - INFO - Processing document 4_2023-03-02
2025-11-14 17:55:53,790 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 17:55:53,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-02-24' --> 'data\processed_data\WMT\4_2023-02-24.md'
Converted 'data\edgar_documents\WMT\4_2023-03-01' --> 'data\processed_data\WMT\4_2023-03-01.md'
Converted 'data\edgar_documents\WMT\4_2023-03-02' --> 'data\processed_data\WMT\4_2023-03-02.md'


2025-11-14 17:55:53,848 - INFO - Going to convert document batch...
2025-11-14 17:55:53,848 - INFO - Processing document 4_2023-03-03
2025-11-14 17:55:53,870 - INFO - Finished converting document 4_2023-03-03 in 0.06 sec.
2025-11-14 17:55:53,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,922 - INFO - Going to convert document batch...
2025-11-14 17:55:53,923 - INFO - Processing document 4_2023-03-08
2025-11-14 17:55:53,948 - INFO - Finished converting document 4_2023-03-08 in 0.06 sec.
2025-11-14 17:55:53,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:53,992 - INFO - Going to convert document batch...
2025-11-14 17:55:53,992 - INFO - Processing document 4_2023-03-10
2025-11-14 17:55:54,013 - INFO - Finished converting document 4_2023-03-10 in 0.05 sec.
2025-11-14 17:55:54,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,051 - INFO - Going to convert document batch...
2025-11-14 17:55:54,052 - 

Converted 'data\edgar_documents\WMT\4_2023-03-03' --> 'data\processed_data\WMT\4_2023-03-03.md'
Converted 'data\edgar_documents\WMT\4_2023-03-08' --> 'data\processed_data\WMT\4_2023-03-08.md'
Converted 'data\edgar_documents\WMT\4_2023-03-10' --> 'data\processed_data\WMT\4_2023-03-10.md'


2025-11-14 17:55:54,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,113 - INFO - Going to convert document batch...
2025-11-14 17:55:54,114 - INFO - Processing document 4_2023-03-15
2025-11-14 17:55:54,141 - INFO - Finished converting document 4_2023-03-15 in 0.05 sec.
2025-11-14 17:55:54,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,226 - INFO - Going to convert document batch...
2025-11-14 17:55:54,227 - INFO - Processing document 4_2023-03-16
2025-11-14 17:55:54,247 - INFO - Finished converting document 4_2023-03-16 in 0.06 sec.
2025-11-14 17:55:54,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-03-13' --> 'data\processed_data\WMT\4_2023-03-13.md'
Converted 'data\edgar_documents\WMT\4_2023-03-15' --> 'data\processed_data\WMT\4_2023-03-15.md'
Converted 'data\edgar_documents\WMT\4_2023-03-16' --> 'data\processed_data\WMT\4_2023-03-16.md'


2025-11-14 17:55:54,289 - INFO - Going to convert document batch...
2025-11-14 17:55:54,290 - INFO - Processing document 4_2023-03-17
2025-11-14 17:55:54,308 - INFO - Finished converting document 4_2023-03-17 in 0.05 sec.
2025-11-14 17:55:54,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,355 - INFO - Going to convert document batch...
2025-11-14 17:55:54,356 - INFO - Processing document 4_2023-03-22
2025-11-14 17:55:54,388 - INFO - Finished converting document 4_2023-03-22 in 0.06 sec.
2025-11-14 17:55:54,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,449 - INFO - Going to convert document batch...
2025-11-14 17:55:54,450 - INFO - Processing document 4_2023-03-24
2025-11-14 17:55:54,476 - INFO - Finished converting document 4_2023-03-24 in 0.05 sec.
2025-11-14 17:55:54,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-03-17' --> 'data\processed_data\WMT\4_2023-03-17.md'
Converted 'data\edgar_documents\WMT\4_2023-03-22' --> 'data\processed_data\WMT\4_2023-03-22.md'
Converted 'data\edgar_documents\WMT\4_2023-03-24' --> 'data\processed_data\WMT\4_2023-03-24.md'


2025-11-14 17:55:54,529 - INFO - Going to convert document batch...
2025-11-14 17:55:54,529 - INFO - Processing document 4_2023-03-29
2025-11-14 17:55:54,558 - INFO - Finished converting document 4_2023-03-29 in 0.06 sec.
2025-11-14 17:55:54,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,616 - INFO - Going to convert document batch...
2025-11-14 17:55:54,616 - INFO - Processing document 4_2023-03-30
2025-11-14 17:55:54,640 - INFO - Finished converting document 4_2023-03-30 in 0.05 sec.
2025-11-14 17:55:54,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:54,690 - INFO - Going to convert document batch...
2025-11-14 17:55:54,691 - INFO - Processing document 4_2023-04-04
2025-11-14 17:55:54,713 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 17:55:54,764 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:54,765 - ERROR - Input document 4_2023-04-12 with format None does 

Converted 'data\edgar_documents\WMT\4_2023-03-29' --> 'data\processed_data\WMT\4_2023-03-29.md'
Converted 'data\edgar_documents\WMT\4_2023-03-30' --> 'data\processed_data\WMT\4_2023-03-30.md'
Converted 'data\edgar_documents\WMT\4_2023-04-04' --> 'data\processed_data\WMT\4_2023-04-04.md'
Error processing data\edgar_documents\WMT\4_2023-04-12: File format not allowed: data\edgar_documents\WMT\4_2023-04-12


2025-11-14 17:55:54,792 - INFO - Going to convert document batch...
2025-11-14 17:55:54,793 - INFO - Processing document 4_2023-04-13
2025-11-14 17:55:54,815 - INFO - Finished converting document 4_2023-04-13 in 0.05 sec.
2025-11-14 17:55:54,866 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:55:54,867 - ERROR - Input document 4_2023-04-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:55:54,868 - INFO - Going to convert document batch...
2025-11-14 17:55:54,892 - IN

Converted 'data\edgar_documents\WMT\4_2023-04-13' --> 'data\processed_data\WMT\4_2023-04-13.md'
Error processing data\edgar_documents\WMT\4_2023-04-14: File format not allowed: data\edgar_documents\WMT\4_2023-04-14
Converted 'data\edgar_documents\WMT\4_2023-05-01' --> 'data\processed_data\WMT\4_2023-05-01.md'


2025-11-14 17:55:55,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,052 - INFO - Going to convert document batch...
2025-11-14 17:55:55,053 - INFO - Processing document 4_2023-05-23
2025-11-14 17:55:55,079 - INFO - Finished converting document 4_2023-05-23 in 0.05 sec.
2025-11-14 17:55:55,124 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,132 - INFO - Going to convert document batch...
2025-11-14 17:55:55,133 - INFO - Processing document 4_2023-05-25
2025-11-14 17:55:55,153 - INFO - Finished converting document 4_2023-05-25 in 0.05 sec.
2025-11-14 17:55:55,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,198 - INFO - Going to convert document batch...
2025-11-14 17:55:55,199 - INFO - Processing document 4_2023-06-02
2025-11-14 17:55:55,219 - INFO - Finished converting document 4_2023-06-02 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2023-05-11' --> 'data\processed_data\WMT\4_2023-05-11.md'
Converted 'data\edgar_documents\WMT\4_2023-05-23' --> 'data\processed_data\WMT\4_2023-05-23.md'
Converted 'data\edgar_documents\WMT\4_2023-05-25' --> 'data\processed_data\WMT\4_2023-05-25.md'


2025-11-14 17:55:55,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,277 - INFO - Going to convert document batch...
2025-11-14 17:55:55,278 - INFO - Processing document 4_2023-06-07
2025-11-14 17:55:55,301 - INFO - Finished converting document 4_2023-06-07 in 0.05 sec.
2025-11-14 17:55:55,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,352 - INFO - Going to convert document batch...
2025-11-14 17:55:55,353 - INFO - Processing document 4_2023-06-09
2025-11-14 17:55:55,385 - INFO - Finished converting document 4_2023-06-09 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2023-06-02' --> 'data\processed_data\WMT\4_2023-06-02.md'
Converted 'data\edgar_documents\WMT\4_2023-06-07' --> 'data\processed_data\WMT\4_2023-06-07.md'
Converted 'data\edgar_documents\WMT\4_2023-06-09' --> 'data\processed_data\WMT\4_2023-06-09.md'


2025-11-14 17:55:55,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,464 - INFO - Going to convert document batch...
2025-11-14 17:55:55,465 - INFO - Processing document 4_2023-06-16
2025-11-14 17:55:55,506 - INFO - Finished converting document 4_2023-06-16 in 0.08 sec.
2025-11-14 17:55:55,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,593 - INFO - Going to convert document batch...
2025-11-14 17:55:55,594 - INFO - Processing document 4_2023-06-22
2025-11-14 17:55:55,621 - INFO - Finished converting document 4_2023-06-22 in 0.06 sec.
2025-11-14 17:55:55,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,669 - INFO - Going to convert document batch...
2025-11-14 17:55:55,669 - INFO - Processing document 4_2023-06-23
2025-11-14 17:55:55,688 - INFO - Finished converting document 4_2023-06-23 in 0.03 sec.
2025-11-14 17:55:55,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\WMT\4_2023-06-16' --> 'data\processed_data\WMT\4_2023-06-16.md'
Converted 'data\edgar_documents\WMT\4_2023-06-22' --> 'data\processed_data\WMT\4_2023-06-22.md'
Converted 'data\edgar_documents\WMT\4_2023-06-23' --> 'data\processed_data\WMT\4_2023-06-23.md'


2025-11-14 17:55:55,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,797 - INFO - Going to convert document batch...
2025-11-14 17:55:55,798 - INFO - Processing document 4_2023-06-29
2025-11-14 17:55:55,829 - INFO - Finished converting document 4_2023-06-29 in 0.06 sec.
2025-11-14 17:55:55,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,892 - INFO - Going to convert document batch...
2025-11-14 17:55:55,893 - INFO - Processing document 4_2023-06-30
2025-11-14 17:55:55,914 - INFO - Finished converting document 4_2023-06-30 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2023-06-28' --> 'data\processed_data\WMT\4_2023-06-28.md'
Converted 'data\edgar_documents\WMT\4_2023-06-29' --> 'data\processed_data\WMT\4_2023-06-29.md'
Converted 'data\edgar_documents\WMT\4_2023-06-30' --> 'data\processed_data\WMT\4_2023-06-30.md'


2025-11-14 17:55:55,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:55,959 - INFO - Going to convert document batch...
2025-11-14 17:55:55,960 - INFO - Processing document 4_2023-07-05
2025-11-14 17:55:55,979 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 17:55:56,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,028 - INFO - Going to convert document batch...
2025-11-14 17:55:56,029 - INFO - Processing document 4_2023-07-06
2025-11-14 17:55:56,053 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 17:55:56,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,099 - INFO - Going to convert document batch...
2025-11-14 17:55:56,100 - INFO - Processing document 4_2023-07-20
2025-11-14 17:55:56,118 - INFO - Finished converting document 4_2023-07-20 in 0.03 sec.
2025-11-14 17:55:56,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\WMT\4_2023-07-05' --> 'data\processed_data\WMT\4_2023-07-05.md'
Converted 'data\edgar_documents\WMT\4_2023-07-06' --> 'data\processed_data\WMT\4_2023-07-06.md'
Converted 'data\edgar_documents\WMT\4_2023-07-20' --> 'data\processed_data\WMT\4_2023-07-20.md'


2025-11-14 17:55:56,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,225 - INFO - Going to convert document batch...
2025-11-14 17:55:56,226 - INFO - Processing document 4_2023-08-03
2025-11-14 17:55:56,245 - INFO - Finished converting document 4_2023-08-03 in 0.05 sec.
2025-11-14 17:55:56,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,303 - INFO - Going to convert document batch...
2025-11-14 17:55:56,305 - INFO - Processing document 4_2023-08-17
2025-11-14 17:55:56,335 - INFO - Finished converting document 4_2023-08-17 in 0.06 sec.
2025-11-14 17:55:56,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-07-28' --> 'data\processed_data\WMT\4_2023-07-28.md'
Converted 'data\edgar_documents\WMT\4_2023-08-03' --> 'data\processed_data\WMT\4_2023-08-03.md'
Converted 'data\edgar_documents\WMT\4_2023-08-17' --> 'data\processed_data\WMT\4_2023-08-17.md'


2025-11-14 17:55:56,397 - INFO - Going to convert document batch...
2025-11-14 17:55:56,398 - INFO - Processing document 4_2023-08-25
2025-11-14 17:55:56,417 - INFO - Finished converting document 4_2023-08-25 in 0.06 sec.
2025-11-14 17:55:56,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,462 - INFO - Going to convert document batch...
2025-11-14 17:55:56,463 - INFO - Processing document 4_2023-09-06
2025-11-14 17:55:56,484 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 17:55:56,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,526 - INFO - Going to convert document batch...
2025-11-14 17:55:56,527 - INFO - Processing document 4_2023-09-14
2025-11-14 17:55:56,545 - INFO - Finished converting document 4_2023-09-14 in 0.05 sec.
2025-11-14 17:55:56,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,585 - INFO - Going to convert document batch...
2025-11-14 17:55:56,585 - 

Converted 'data\edgar_documents\WMT\4_2023-08-25' --> 'data\processed_data\WMT\4_2023-08-25.md'
Converted 'data\edgar_documents\WMT\4_2023-09-06' --> 'data\processed_data\WMT\4_2023-09-06.md'
Converted 'data\edgar_documents\WMT\4_2023-09-14' --> 'data\processed_data\WMT\4_2023-09-14.md'


2025-11-14 17:55:56,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,644 - INFO - Going to convert document batch...
2025-11-14 17:55:56,645 - INFO - Processing document 4_2023-10-03
2025-11-14 17:55:56,663 - INFO - Finished converting document 4_2023-10-03 in 0.03 sec.
2025-11-14 17:55:56,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,711 - INFO - Going to convert document batch...
2025-11-14 17:55:56,713 - INFO - Processing document 4_2023-10-04
2025-11-14 17:55:56,745 - INFO - Finished converting document 4_2023-10-04 in 0.06 sec.
2025-11-14 17:55:56,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,797 - INFO - Going to convert document batch...
2025-11-14 17:55:56,798 - INFO - Processing document 4_2023-10-12
2025-11-14 17:55:56,817 - INFO - Finished converting document 4_2023-10-12 in 0.03 sec.


Converted 'data\edgar_documents\WMT\4_2023-09-29' --> 'data\processed_data\WMT\4_2023-09-29.md'
Converted 'data\edgar_documents\WMT\4_2023-10-03' --> 'data\processed_data\WMT\4_2023-10-03.md'
Converted 'data\edgar_documents\WMT\4_2023-10-04' --> 'data\processed_data\WMT\4_2023-10-04.md'


2025-11-14 17:55:56,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,857 - INFO - Going to convert document batch...
2025-11-14 17:55:56,858 - INFO - Processing document 4_2023-10-26
2025-11-14 17:55:56,877 - INFO - Finished converting document 4_2023-10-26 in 0.03 sec.
2025-11-14 17:55:56,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,919 - INFO - Going to convert document batch...
2025-11-14 17:55:56,919 - INFO - Processing document 4_2023-10-27
2025-11-14 17:55:56,940 - INFO - Finished converting document 4_2023-10-27 in 0.05 sec.
2025-11-14 17:55:56,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:56,982 - INFO - Going to convert document batch...
2025-11-14 17:55:56,982 - INFO - Processing document 4_2023-11-03
2025-11-14 17:55:57,003 - INFO - Finished converting document 4_2023-11-03 in 0.05 sec.
2025-11-14 17:55:57,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2023-10-12' --> 'data\processed_data\WMT\4_2023-10-12.md'
Converted 'data\edgar_documents\WMT\4_2023-10-26' --> 'data\processed_data\WMT\4_2023-10-26.md'
Converted 'data\edgar_documents\WMT\4_2023-10-27' --> 'data\processed_data\WMT\4_2023-10-27.md'
Converted 'data\edgar_documents\WMT\4_2023-11-03' --> 'data\processed_data\WMT\4_2023-11-03.md'


2025-11-14 17:55:57,045 - INFO - Going to convert document batch...
2025-11-14 17:55:57,046 - INFO - Processing document 4_2023-11-09
2025-11-14 17:55:57,066 - INFO - Finished converting document 4_2023-11-09 in 0.05 sec.
2025-11-14 17:55:57,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,111 - INFO - Going to convert document batch...
2025-11-14 17:55:57,112 - INFO - Processing document 4_2023-11-21
2025-11-14 17:55:57,142 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 17:55:57,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,191 - INFO - Going to convert document batch...
2025-11-14 17:55:57,192 - INFO - Processing document 4_2023-11-24
2025-11-14 17:55:57,216 - INFO - Finished converting document 4_2023-11-24 in 0.05 sec.
2025-11-14 17:55:57,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,261 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WMT\4_2023-11-09' --> 'data\processed_data\WMT\4_2023-11-09.md'
Converted 'data\edgar_documents\WMT\4_2023-11-21' --> 'data\processed_data\WMT\4_2023-11-21.md'
Converted 'data\edgar_documents\WMT\4_2023-11-24' --> 'data\processed_data\WMT\4_2023-11-24.md'


2025-11-14 17:55:57,262 - INFO - Processing document 4_2023-11-29
2025-11-14 17:55:57,281 - INFO - Finished converting document 4_2023-11-29 in 0.05 sec.
2025-11-14 17:55:57,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,339 - INFO - Going to convert document batch...
2025-11-14 17:55:57,341 - INFO - Processing document 4_2023-12-01
2025-11-14 17:55:57,383 - INFO - Finished converting document 4_2023-12-01 in 0.08 sec.
2025-11-14 17:55:57,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,439 - INFO - Going to convert document batch...
2025-11-14 17:55:57,440 - INFO - Processing document 4_2023-12-05
2025-11-14 17:55:57,462 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2023-11-29' --> 'data\processed_data\WMT\4_2023-11-29.md'
Converted 'data\edgar_documents\WMT\4_2023-12-01' --> 'data\processed_data\WMT\4_2023-12-01.md'


2025-11-14 17:55:57,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,507 - INFO - Going to convert document batch...
2025-11-14 17:55:57,508 - INFO - Processing document 4_2023-12-07
2025-11-14 17:55:57,526 - INFO - Finished converting document 4_2023-12-07 in 0.05 sec.
2025-11-14 17:55:57,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,569 - INFO - Going to convert document batch...
2025-11-14 17:55:57,570 - INFO - Processing document 4_2023-12-08


Converted 'data\edgar_documents\WMT\4_2023-12-05' --> 'data\processed_data\WMT\4_2023-12-05.md'
Converted 'data\edgar_documents\WMT\4_2023-12-07' --> 'data\processed_data\WMT\4_2023-12-07.md'


2025-11-14 17:55:57,931 - INFO - Finished converting document 4_2023-12-08 in 0.38 sec.
2025-11-14 17:55:57,968 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:57,976 - INFO - Going to convert document batch...
2025-11-14 17:55:57,976 - INFO - Processing document 4_2023-12-14
2025-11-14 17:55:57,997 - INFO - Finished converting document 4_2023-12-14 in 0.05 sec.
2025-11-14 17:55:58,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,052 - INFO - Going to convert document batch...
2025-11-14 17:55:58,053 - INFO - Processing document 4_2023-12-20
2025-11-14 17:55:58,086 - INFO - Finished converting document 4_2023-12-20 in 0.06 sec.
2025-11-14 17:55:58,121 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,129 - INFO - Going to convert document batch...
2025-11-14 17:55:58,130 - INFO - Processing document 4_2023-12-21
2025-11-14 17:55:58,148 - INFO - Finished converting document 4_2023-12-21 in 0.03 sec.


Converted 'data\edgar_documents\WMT\4_2023-12-08' --> 'data\processed_data\WMT\4_2023-12-08.md'
Converted 'data\edgar_documents\WMT\4_2023-12-14' --> 'data\processed_data\WMT\4_2023-12-14.md'
Converted 'data\edgar_documents\WMT\4_2023-12-20' --> 'data\processed_data\WMT\4_2023-12-20.md'


2025-11-14 17:55:58,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,189 - INFO - Going to convert document batch...
2025-11-14 17:55:58,190 - INFO - Processing document 4_2023-12-22
2025-11-14 17:55:58,211 - INFO - Finished converting document 4_2023-12-22 in 0.03 sec.
2025-11-14 17:55:58,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,260 - INFO - Going to convert document batch...
2025-11-14 17:55:58,260 - INFO - Processing document 4_2023-12-29
2025-11-14 17:55:58,284 - INFO - Finished converting document 4_2023-12-29 in 0.05 sec.
2025-11-14 17:55:58,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,330 - INFO - Going to convert document batch...
2025-11-14 17:55:58,331 - INFO - Processing document 4_2024-01-03
2025-11-14 17:55:58,350 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.


Converted 'data\edgar_documents\WMT\4_2023-12-21' --> 'data\processed_data\WMT\4_2023-12-21.md'
Converted 'data\edgar_documents\WMT\4_2023-12-22' --> 'data\processed_data\WMT\4_2023-12-22.md'
Converted 'data\edgar_documents\WMT\4_2023-12-29' --> 'data\processed_data\WMT\4_2023-12-29.md'
Converted 'data\edgar_documents\WMT\4_2024-01-03' --> 'data\processed_data\WMT\4_2024-01-03.md'


2025-11-14 17:55:58,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,392 - INFO - Going to convert document batch...
2025-11-14 17:55:58,392 - INFO - Processing document 4_2024-01-04
2025-11-14 17:55:58,415 - INFO - Finished converting document 4_2024-01-04 in 0.03 sec.
2025-11-14 17:55:58,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,488 - INFO - Going to convert document batch...
2025-11-14 17:55:58,489 - INFO - Processing document 4_2024-01-16
2025-11-14 17:55:58,514 - INFO - Finished converting document 4_2024-01-16 in 0.06 sec.
2025-11-14 17:55:58,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,556 - INFO - Going to convert document batch...
2025-11-14 17:55:58,557 - INFO - Processing document 4_2024-01-18
2025-11-14 17:55:58,577 - INFO - Finished converting document 4_2024-01-18 in 0.05 sec.
2025-11-14 17:55:58,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\WMT\4_2024-01-04' --> 'data\processed_data\WMT\4_2024-01-04.md'
Converted 'data\edgar_documents\WMT\4_2024-01-16' --> 'data\processed_data\WMT\4_2024-01-16.md'
Converted 'data\edgar_documents\WMT\4_2024-01-18' --> 'data\processed_data\WMT\4_2024-01-18.md'


2025-11-14 17:55:58,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,685 - INFO - Going to convert document batch...
2025-11-14 17:55:58,685 - INFO - Processing document 4_2024-02-02
2025-11-14 17:55:58,706 - INFO - Finished converting document 4_2024-02-02 in 0.05 sec.
2025-11-14 17:55:58,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,751 - INFO - Going to convert document batch...
2025-11-14 17:55:58,752 - INFO - Processing document 4_2024-02-05
2025-11-14 17:55:58,775 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 17:55:58,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,815 - INFO - Going to convert document batch...
2025-11-14 17:55:58,815 - INFO - Processing document 4_2024-02-14
2025-11-14 17:55:58,833 - INFO - Finished converting document 4_2024-02-14 in 0.03 sec.
2025-11-14 17:55:58,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2024-01-26' --> 'data\processed_data\WMT\4_2024-01-26.md'
Converted 'data\edgar_documents\WMT\4_2024-02-02' --> 'data\processed_data\WMT\4_2024-02-02.md'
Converted 'data\edgar_documents\WMT\4_2024-02-05' --> 'data\processed_data\WMT\4_2024-02-05.md'
Converted 'data\edgar_documents\WMT\4_2024-02-14' --> 'data\processed_data\WMT\4_2024-02-14.md'


2025-11-14 17:55:58,879 - INFO - Going to convert document batch...
2025-11-14 17:55:58,880 - INFO - Processing document 4_2024-02-23
2025-11-14 17:55:58,912 - INFO - Finished converting document 4_2024-02-23 in 0.05 sec.
2025-11-14 17:55:58,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:58,967 - INFO - Going to convert document batch...
2025-11-14 17:55:58,968 - INFO - Processing document 4_2024-02-28
2025-11-14 17:55:58,987 - INFO - Finished converting document 4_2024-02-28 in 0.05 sec.
2025-11-14 17:55:59,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,028 - INFO - Going to convert document batch...
2025-11-14 17:55:59,028 - INFO - Processing document 4_2024-03-01
2025-11-14 17:55:59,045 - INFO - Finished converting document 4_2024-03-01 in 0.05 sec.
2025-11-14 17:55:59,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,084 - INFO - Going to convert document batch...
2025-11-14 17:55:59,085 - 

Converted 'data\edgar_documents\WMT\4_2024-02-23' --> 'data\processed_data\WMT\4_2024-02-23.md'
Converted 'data\edgar_documents\WMT\4_2024-02-28' --> 'data\processed_data\WMT\4_2024-02-28.md'
Converted 'data\edgar_documents\WMT\4_2024-03-01' --> 'data\processed_data\WMT\4_2024-03-01.md'
Converted 'data\edgar_documents\WMT\4_2024-03-05' --> 'data\processed_data\WMT\4_2024-03-05.md'


2025-11-14 17:55:59,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,169 - INFO - Going to convert document batch...
2025-11-14 17:55:59,170 - INFO - Processing document 4_2024-03-06
2025-11-14 17:55:59,187 - INFO - Finished converting document 4_2024-03-06 in 0.06 sec.
2025-11-14 17:55:59,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,233 - INFO - Going to convert document batch...
2025-11-14 17:55:59,234 - INFO - Processing document 4_2024-03-14
2025-11-14 17:55:59,257 - INFO - Finished converting document 4_2024-03-14 in 0.05 sec.
2025-11-14 17:55:59,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,298 - INFO - Going to convert document batch...
2025-11-14 17:55:59,299 - INFO - Processing document 4_2024-04-01
2025-11-14 17:55:59,318 - INFO - Finished converting document 4_2024-04-01 in 0.03 sec.
2025-11-14 17:55:59,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\WMT\4_2024-03-06' --> 'data\processed_data\WMT\4_2024-03-06.md'
Converted 'data\edgar_documents\WMT\4_2024-03-14' --> 'data\processed_data\WMT\4_2024-03-14.md'
Converted 'data\edgar_documents\WMT\4_2024-04-01' --> 'data\processed_data\WMT\4_2024-04-01.md'
Converted 'data\edgar_documents\WMT\4_2024-04-02' --> 'data\processed_data\WMT\4_2024-04-02.md'


2025-11-14 17:55:59,417 - INFO - Going to convert document batch...
2025-11-14 17:55:59,417 - INFO - Processing document 4_2024-04-11
2025-11-14 17:55:59,435 - INFO - Finished converting document 4_2024-04-11 in 0.05 sec.
2025-11-14 17:55:59,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,477 - INFO - Going to convert document batch...
2025-11-14 17:55:59,478 - INFO - Processing document 4_2024-04-29
2025-11-14 17:55:59,525 - INFO - Finished converting document 4_2024-04-29 in 0.06 sec.
2025-11-14 17:55:59,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,574 - INFO - Going to convert document batch...
2025-11-14 17:55:59,574 - INFO - Processing document 4_2024-05-03
2025-11-14 17:55:59,592 - INFO - Finished converting document 4_2024-05-03 in 0.05 sec.
2025-11-14 17:55:59,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,630 - INFO - Going to convert document batch...
2025-11-14 17:55:59,631 - 

Converted 'data\edgar_documents\WMT\4_2024-04-11' --> 'data\processed_data\WMT\4_2024-04-11.md'
Converted 'data\edgar_documents\WMT\4_2024-04-29' --> 'data\processed_data\WMT\4_2024-04-29.md'
Converted 'data\edgar_documents\WMT\4_2024-05-03' --> 'data\processed_data\WMT\4_2024-05-03.md'


2025-11-14 17:55:59,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,688 - INFO - Going to convert document batch...
2025-11-14 17:55:59,688 - INFO - Processing document 4_2024-05-21
2025-11-14 17:55:59,707 - INFO - Finished converting document 4_2024-05-21 in 0.03 sec.
2025-11-14 17:55:59,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,760 - INFO - Going to convert document batch...
2025-11-14 17:55:59,761 - INFO - Processing document 4_2024-05-23
2025-11-14 17:55:59,781 - INFO - Finished converting document 4_2024-05-23 in 0.05 sec.
2025-11-14 17:55:59,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,823 - INFO - Going to convert document batch...
2025-11-14 17:55:59,824 - INFO - Processing document 4_2024-05-24
2025-11-14 17:55:59,847 - INFO - Finished converting document 4_2024-05-24 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2024-05-09' --> 'data\processed_data\WMT\4_2024-05-09.md'
Converted 'data\edgar_documents\WMT\4_2024-05-21' --> 'data\processed_data\WMT\4_2024-05-21.md'
Converted 'data\edgar_documents\WMT\4_2024-05-23' --> 'data\processed_data\WMT\4_2024-05-23.md'
Converted 'data\edgar_documents\WMT\4_2024-05-24' --> 'data\processed_data\WMT\4_2024-05-24.md'


2025-11-14 17:55:59,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:55:59,907 - INFO - Going to convert document batch...
2025-11-14 17:55:59,908 - INFO - Processing document 4_2024-05-30
2025-11-14 17:55:59,929 - INFO - Finished converting document 4_2024-05-30 in 0.05 sec.
2025-11-14 17:55:59,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,009 - INFO - Going to convert document batch...
2025-11-14 17:56:00,010 - INFO - Processing document 4_2024-06-05
2025-11-14 17:56:00,036 - INFO - Finished converting document 4_2024-06-05 in 0.06 sec.
2025-11-14 17:56:00,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,105 - INFO - Going to convert document batch...
2025-11-14 17:56:00,106 - INFO - Processing document 4_2024-06-06
2025-11-14 17:56:00,128 - INFO - Finished converting document 4_2024-06-06 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2024-05-30' --> 'data\processed_data\WMT\4_2024-05-30.md'
Converted 'data\edgar_documents\WMT\4_2024-06-05' --> 'data\processed_data\WMT\4_2024-06-05.md'


2025-11-14 17:56:00,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,179 - INFO - Going to convert document batch...
2025-11-14 17:56:00,180 - INFO - Processing document 4_2024-06-07
2025-11-14 17:56:00,208 - INFO - Finished converting document 4_2024-06-07 in 0.05 sec.
2025-11-14 17:56:00,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,260 - INFO - Going to convert document batch...
2025-11-14 17:56:00,261 - INFO - Processing document 4_2024-06-12
2025-11-14 17:56:00,288 - INFO - Finished converting document 4_2024-06-12 in 0.05 sec.
2025-11-14 17:56:00,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,338 - INFO - Going to convert document batch...
2025-11-14 17:56:00,338 - INFO - Processing document 4_2024-06-14


Converted 'data\edgar_documents\WMT\4_2024-06-06' --> 'data\processed_data\WMT\4_2024-06-06.md'
Converted 'data\edgar_documents\WMT\4_2024-06-07' --> 'data\processed_data\WMT\4_2024-06-07.md'
Converted 'data\edgar_documents\WMT\4_2024-06-12' --> 'data\processed_data\WMT\4_2024-06-12.md'


2025-11-14 17:56:00,362 - INFO - Finished converting document 4_2024-06-14 in 0.05 sec.
2025-11-14 17:56:00,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,420 - INFO - Going to convert document batch...
2025-11-14 17:56:00,422 - INFO - Processing document 4_2024-06-20
2025-11-14 17:56:00,460 - INFO - Finished converting document 4_2024-06-20 in 0.06 sec.
2025-11-14 17:56:00,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,517 - INFO - Going to convert document batch...
2025-11-14 17:56:00,519 - INFO - Processing document 4_2024-06-26
2025-11-14 17:56:00,549 - INFO - Finished converting document 4_2024-06-26 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2024-06-14' --> 'data\processed_data\WMT\4_2024-06-14.md'
Converted 'data\edgar_documents\WMT\4_2024-06-20' --> 'data\processed_data\WMT\4_2024-06-20.md'


2025-11-14 17:56:00,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,602 - INFO - Going to convert document batch...
2025-11-14 17:56:00,603 - INFO - Processing document 4_2024-06-28
2025-11-14 17:56:00,632 - INFO - Finished converting document 4_2024-06-28 in 0.05 sec.
2025-11-14 17:56:00,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,679 - INFO - Going to convert document batch...
2025-11-14 17:56:00,680 - INFO - Processing document 4_2024-07-02
2025-11-14 17:56:00,702 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 17:56:00,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,745 - INFO - Going to convert document batch...
2025-11-14 17:56:00,746 - INFO - Processing document 4_2024-07-05
2025-11-14 17:56:00,765 - INFO - Finished converting document 4_2024-07-05 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2024-06-26' --> 'data\processed_data\WMT\4_2024-06-26.md'
Converted 'data\edgar_documents\WMT\4_2024-06-28' --> 'data\processed_data\WMT\4_2024-06-28.md'
Converted 'data\edgar_documents\WMT\4_2024-07-02' --> 'data\processed_data\WMT\4_2024-07-02.md'


2025-11-14 17:56:00,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,808 - INFO - Going to convert document batch...
2025-11-14 17:56:00,808 - INFO - Processing document 4_2024-07-17
2025-11-14 17:56:00,827 - INFO - Finished converting document 4_2024-07-17 in 0.05 sec.
2025-11-14 17:56:00,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,869 - INFO - Going to convert document batch...
2025-11-14 17:56:00,870 - INFO - Processing document 4_2024-07-19
2025-11-14 17:56:00,889 - INFO - Finished converting document 4_2024-07-19 in 0.05 sec.
2025-11-14 17:56:00,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:00,933 - INFO - Going to convert document batch...
2025-11-14 17:56:00,934 - INFO - Processing document 4_2024-07-26
2025-11-14 17:56:00,954 - INFO - Finished converting document 4_2024-07-26 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2024-07-05' --> 'data\processed_data\WMT\4_2024-07-05.md'
Converted 'data\edgar_documents\WMT\4_2024-07-17' --> 'data\processed_data\WMT\4_2024-07-17.md'
Converted 'data\edgar_documents\WMT\4_2024-07-19' --> 'data\processed_data\WMT\4_2024-07-19.md'


2025-11-14 17:56:01,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,023 - INFO - Going to convert document batch...
2025-11-14 17:56:01,023 - INFO - Processing document 4_2024-08-01
2025-11-14 17:56:01,047 - INFO - Finished converting document 4_2024-08-01 in 0.05 sec.
2025-11-14 17:56:01,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,107 - INFO - Going to convert document batch...
2025-11-14 17:56:01,108 - INFO - Processing document 4_2024-08-05
2025-11-14 17:56:01,132 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 17:56:01,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,180 - INFO - Going to convert document batch...
2025-11-14 17:56:01,181 - INFO - Processing document 4_2024-08-15
2025-11-14 17:56:01,203 - INFO - Finished converting document 4_2024-08-15 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2024-07-26' --> 'data\processed_data\WMT\4_2024-07-26.md'
Converted 'data\edgar_documents\WMT\4_2024-08-01' --> 'data\processed_data\WMT\4_2024-08-01.md'
Converted 'data\edgar_documents\WMT\4_2024-08-05' --> 'data\processed_data\WMT\4_2024-08-05.md'


2025-11-14 17:56:01,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,249 - INFO - Going to convert document batch...
2025-11-14 17:56:01,250 - INFO - Processing document 4_2024-08-16
2025-11-14 17:56:01,272 - INFO - Finished converting document 4_2024-08-16 in 0.05 sec.
2025-11-14 17:56:01,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,318 - INFO - Going to convert document batch...
2025-11-14 17:56:01,319 - INFO - Processing document 4_2024-08-23
2025-11-14 17:56:01,344 - INFO - Finished converting document 4_2024-08-23 in 0.05 sec.
2025-11-14 17:56:01,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,388 - INFO - Going to convert document batch...
2025-11-14 17:56:01,389 - INFO - Processing document 4_2024-08-29


Converted 'data\edgar_documents\WMT\4_2024-08-15' --> 'data\processed_data\WMT\4_2024-08-15.md'
Converted 'data\edgar_documents\WMT\4_2024-08-16' --> 'data\processed_data\WMT\4_2024-08-16.md'
Converted 'data\edgar_documents\WMT\4_2024-08-23' --> 'data\processed_data\WMT\4_2024-08-23.md'


2025-11-14 17:56:01,407 - INFO - Finished converting document 4_2024-08-29 in 0.05 sec.
2025-11-14 17:56:01,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,458 - INFO - Going to convert document batch...
2025-11-14 17:56:01,458 - INFO - Processing document 4_2024-09-05
2025-11-14 17:56:01,503 - INFO - Finished converting document 4_2024-09-05 in 0.08 sec.
2025-11-14 17:56:01,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,589 - INFO - Going to convert document batch...
2025-11-14 17:56:01,591 - INFO - Processing document 4_2024-09-10


Converted 'data\edgar_documents\WMT\4_2024-08-29' --> 'data\processed_data\WMT\4_2024-08-29.md'
Converted 'data\edgar_documents\WMT\4_2024-09-05' --> 'data\processed_data\WMT\4_2024-09-05.md'


2025-11-14 17:56:01,628 - INFO - Finished converting document 4_2024-09-10 in 0.06 sec.
2025-11-14 17:56:01,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,692 - INFO - Going to convert document batch...
2025-11-14 17:56:01,694 - INFO - Processing document 4_2024-09-12
2025-11-14 17:56:01,724 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.
2025-11-14 17:56:01,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,802 - INFO - Going to convert document batch...
2025-11-14 17:56:01,804 - INFO - Processing document 4_2024-09-13
2025-11-14 17:56:01,843 - INFO - Finished converting document 4_2024-09-13 in 0.09 sec.


Converted 'data\edgar_documents\WMT\4_2024-09-10' --> 'data\processed_data\WMT\4_2024-09-10.md'
Converted 'data\edgar_documents\WMT\4_2024-09-12' --> 'data\processed_data\WMT\4_2024-09-12.md'


2025-11-14 17:56:01,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,896 - INFO - Going to convert document batch...
2025-11-14 17:56:01,897 - INFO - Processing document 4_2024-09-18
2025-11-14 17:56:01,918 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 17:56:01,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:01,967 - INFO - Going to convert document batch...
2025-11-14 17:56:01,968 - INFO - Processing document 4_2024-09-19
2025-11-14 17:56:02,003 - INFO - Finished converting document 4_2024-09-19 in 0.06 sec.
2025-11-14 17:56:02,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,054 - INFO - Going to convert document batch...
2025-11-14 17:56:02,054 - INFO - Processing document 4_2024-09-26


Converted 'data\edgar_documents\WMT\4_2024-09-13' --> 'data\processed_data\WMT\4_2024-09-13.md'
Converted 'data\edgar_documents\WMT\4_2024-09-18' --> 'data\processed_data\WMT\4_2024-09-18.md'
Converted 'data\edgar_documents\WMT\4_2024-09-19' --> 'data\processed_data\WMT\4_2024-09-19.md'


2025-11-14 17:56:02,073 - INFO - Finished converting document 4_2024-09-26 in 0.05 sec.
2025-11-14 17:56:02,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,117 - INFO - Going to convert document batch...
2025-11-14 17:56:02,118 - INFO - Processing document 4_2024-09-30
2025-11-14 17:56:02,149 - INFO - Finished converting document 4_2024-09-30 in 0.05 sec.
2025-11-14 17:56:02,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,234 - INFO - Going to convert document batch...
2025-11-14 17:56:02,235 - INFO - Processing document 4_2024-10-02
2025-11-14 17:56:02,257 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2024-09-26' --> 'data\processed_data\WMT\4_2024-09-26.md'
Converted 'data\edgar_documents\WMT\4_2024-09-30' --> 'data\processed_data\WMT\4_2024-09-30.md'
Converted 'data\edgar_documents\WMT\4_2024-10-02' --> 'data\processed_data\WMT\4_2024-10-02.md'


2025-11-14 17:56:02,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,300 - INFO - Going to convert document batch...
2025-11-14 17:56:02,301 - INFO - Processing document 4_2024-10-03
2025-11-14 17:56:02,544 - INFO - Finished converting document 4_2024-10-03 in 0.27 sec.
2025-11-14 17:56:02,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,582 - INFO - Going to convert document batch...
2025-11-14 17:56:02,583 - INFO - Processing document 4_2024-10-10
2025-11-14 17:56:02,600 - INFO - Finished converting document 4_2024-10-10 in 0.03 sec.
2025-11-14 17:56:02,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,657 - INFO - Going to convert document batch...
2025-11-14 17:56:02,658 - INFO - Processing document 4_2024-10-16
2025-11-14 17:56:02,677 - INFO - Finished converting document 4_2024-10-16 in 0.05 sec.
2025-11-14 17:56:02,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:

Converted 'data\edgar_documents\WMT\4_2024-10-03' --> 'data\processed_data\WMT\4_2024-10-03.md'
Converted 'data\edgar_documents\WMT\4_2024-10-10' --> 'data\processed_data\WMT\4_2024-10-10.md'
Converted 'data\edgar_documents\WMT\4_2024-10-16' --> 'data\processed_data\WMT\4_2024-10-16.md'
Converted 'data\edgar_documents\WMT\4_2024-10-23' --> 'data\processed_data\WMT\4_2024-10-23.md'


2025-11-14 17:56:02,781 - INFO - Going to convert document batch...
2025-11-14 17:56:02,782 - INFO - Processing document 4_2024-10-25
2025-11-14 17:56:02,806 - INFO - Finished converting document 4_2024-10-25 in 0.05 sec.
2025-11-14 17:56:02,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,855 - INFO - Going to convert document batch...
2025-11-14 17:56:02,857 - INFO - Processing document 4_2024-11-05
2025-11-14 17:56:02,881 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 17:56:02,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,927 - INFO - Going to convert document batch...
2025-11-14 17:56:02,928 - INFO - Processing document 4_2024-11-18
2025-11-14 17:56:02,948 - INFO - Finished converting document 4_2024-11-18 in 0.05 sec.
2025-11-14 17:56:02,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:02,994 - INFO - Going to convert document batch...
2025-11-14 17:56:02,996 - 

Converted 'data\edgar_documents\WMT\4_2024-10-25' --> 'data\processed_data\WMT\4_2024-10-25.md'
Converted 'data\edgar_documents\WMT\4_2024-11-05' --> 'data\processed_data\WMT\4_2024-11-05.md'
Converted 'data\edgar_documents\WMT\4_2024-11-18' --> 'data\processed_data\WMT\4_2024-11-18.md'


2025-11-14 17:56:03,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,056 - INFO - Going to convert document batch...
2025-11-14 17:56:03,057 - INFO - Processing document 4_2024-11-29
2025-11-14 17:56:03,077 - INFO - Finished converting document 4_2024-11-29 in 0.05 sec.
2025-11-14 17:56:03,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,146 - INFO - Going to convert document batch...
2025-11-14 17:56:03,148 - INFO - Processing document 4_2024-12-04
2025-11-14 17:56:03,188 - INFO - Finished converting document 4_2024-12-04 in 0.09 sec.
2025-11-14 17:56:03,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2024-11-21' --> 'data\processed_data\WMT\4_2024-11-21.md'
Converted 'data\edgar_documents\WMT\4_2024-11-29' --> 'data\processed_data\WMT\4_2024-11-29.md'
Converted 'data\edgar_documents\WMT\4_2024-12-04' --> 'data\processed_data\WMT\4_2024-12-04.md'


2025-11-14 17:56:03,238 - INFO - Going to convert document batch...
2025-11-14 17:56:03,239 - INFO - Processing document 4_2024-12-05
2025-11-14 17:56:03,268 - INFO - Finished converting document 4_2024-12-05 in 0.05 sec.
2025-11-14 17:56:03,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,322 - INFO - Going to convert document batch...
2025-11-14 17:56:03,323 - INFO - Processing document 4_2024-12-17
2025-11-14 17:56:03,373 - INFO - Finished converting document 4_2024-12-17 in 0.08 sec.
2025-11-14 17:56:03,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,468 - INFO - Going to convert document batch...
2025-11-14 17:56:03,469 - INFO - Processing document 4_2024-12-19


Converted 'data\edgar_documents\WMT\4_2024-12-05' --> 'data\processed_data\WMT\4_2024-12-05.md'
Converted 'data\edgar_documents\WMT\4_2024-12-17' --> 'data\processed_data\WMT\4_2024-12-17.md'


2025-11-14 17:56:03,514 - INFO - Finished converting document 4_2024-12-19 in 0.09 sec.
2025-11-14 17:56:03,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,594 - INFO - Going to convert document batch...
2025-11-14 17:56:03,596 - INFO - Processing document 4_2024-12-26
2025-11-14 17:56:03,649 - INFO - Finished converting document 4_2024-12-26 in 0.08 sec.
2025-11-14 17:56:03,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,731 - INFO - Going to convert document batch...
2025-11-14 17:56:03,733 - INFO - Processing document 4_2024-12-27
2025-11-14 17:56:03,766 - INFO - Finished converting document 4_2024-12-27 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2024-12-19' --> 'data\processed_data\WMT\4_2024-12-19.md'
Converted 'data\edgar_documents\WMT\4_2024-12-26' --> 'data\processed_data\WMT\4_2024-12-26.md'


2025-11-14 17:56:03,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,836 - INFO - Going to convert document batch...
2025-11-14 17:56:03,837 - INFO - Processing document 4_2025-01-03
2025-11-14 17:56:03,865 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:56:03,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,916 - INFO - Going to convert document batch...
2025-11-14 17:56:03,918 - INFO - Processing document 4_2025-01-15
2025-11-14 17:56:03,945 - INFO - Finished converting document 4_2025-01-15 in 0.05 sec.
2025-11-14 17:56:03,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:03,992 - INFO - Going to convert document batch...
2025-11-14 17:56:03,994 - INFO - Processing document 4_2025-01-17


Converted 'data\edgar_documents\WMT\4_2024-12-27' --> 'data\processed_data\WMT\4_2024-12-27.md'
Converted 'data\edgar_documents\WMT\4_2025-01-03' --> 'data\processed_data\WMT\4_2025-01-03.md'
Converted 'data\edgar_documents\WMT\4_2025-01-15' --> 'data\processed_data\WMT\4_2025-01-15.md'


2025-11-14 17:56:04,017 - INFO - Finished converting document 4_2025-01-17 in 0.05 sec.
2025-11-14 17:56:04,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,074 - INFO - Going to convert document batch...
2025-11-14 17:56:04,075 - INFO - Processing document 4_2025-01-24
2025-11-14 17:56:04,124 - INFO - Finished converting document 4_2025-01-24 in 0.08 sec.
2025-11-14 17:56:04,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,208 - INFO - Going to convert document batch...
2025-11-14 17:56:04,209 - INFO - Processing document 4_2025-02-03
2025-11-14 17:56:04,250 - INFO - Finished converting document 4_2025-02-03 in 0.08 sec.


Converted 'data\edgar_documents\WMT\4_2025-01-17' --> 'data\processed_data\WMT\4_2025-01-17.md'
Converted 'data\edgar_documents\WMT\4_2025-01-24' --> 'data\processed_data\WMT\4_2025-01-24.md'


2025-11-14 17:56:04,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,307 - INFO - Going to convert document batch...
2025-11-14 17:56:04,308 - INFO - Processing document 4_2025-02-05
2025-11-14 17:56:04,335 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:56:04,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,385 - INFO - Going to convert document batch...
2025-11-14 17:56:04,385 - INFO - Processing document 4_2025-02-13
2025-11-14 17:56:04,407 - INFO - Finished converting document 4_2025-02-13 in 0.05 sec.
2025-11-14 17:56:04,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,453 - INFO - Going to convert document batch...
2025-11-14 17:56:04,454 - INFO - Processing document 4_2025-02-20


Converted 'data\edgar_documents\WMT\4_2025-02-03' --> 'data\processed_data\WMT\4_2025-02-03.md'
Converted 'data\edgar_documents\WMT\4_2025-02-05' --> 'data\processed_data\WMT\4_2025-02-05.md'
Converted 'data\edgar_documents\WMT\4_2025-02-13' --> 'data\processed_data\WMT\4_2025-02-13.md'


2025-11-14 17:56:04,474 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 17:56:04,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,522 - INFO - Going to convert document batch...
2025-11-14 17:56:04,523 - INFO - Processing document 4_2025-02-24
2025-11-14 17:56:04,543 - INFO - Finished converting document 4_2025-02-24 in 0.05 sec.
2025-11-14 17:56:04,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,595 - INFO - Going to convert document batch...
2025-11-14 17:56:04,596 - INFO - Processing document 4_2025-02-28
2025-11-14 17:56:04,623 - INFO - Finished converting document 4_2025-02-28 in 0.06 sec.
2025-11-14 17:56:04,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,672 - INFO - Going to convert document batch...
2025-11-14 17:56:04,673 - INFO - Processing document 4_2025-03-04
2025-11-14 17:56:04,695 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2025-02-20' --> 'data\processed_data\WMT\4_2025-02-20.md'
Converted 'data\edgar_documents\WMT\4_2025-02-24' --> 'data\processed_data\WMT\4_2025-02-24.md'
Converted 'data\edgar_documents\WMT\4_2025-02-28' --> 'data\processed_data\WMT\4_2025-02-28.md'


2025-11-14 17:56:04,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,744 - INFO - Going to convert document batch...
2025-11-14 17:56:04,745 - INFO - Processing document 4_2025-03-05
2025-11-14 17:56:04,782 - INFO - Finished converting document 4_2025-03-05 in 0.06 sec.
2025-11-14 17:56:04,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,880 - INFO - Going to convert document batch...
2025-11-14 17:56:04,881 - INFO - Processing document 4_2025-03-07


Converted 'data\edgar_documents\WMT\4_2025-03-04' --> 'data\processed_data\WMT\4_2025-03-04.md'
Converted 'data\edgar_documents\WMT\4_2025-03-05' --> 'data\processed_data\WMT\4_2025-03-05.md'


2025-11-14 17:56:04,909 - INFO - Finished converting document 4_2025-03-07 in 0.06 sec.
2025-11-14 17:56:04,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:04,969 - INFO - Going to convert document batch...
2025-11-14 17:56:04,970 - INFO - Processing document 4_2025-03-10
2025-11-14 17:56:05,004 - INFO - Finished converting document 4_2025-03-10 in 0.06 sec.
2025-11-14 17:56:05,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,059 - INFO - Going to convert document batch...
2025-11-14 17:56:05,060 - INFO - Processing document 4_2025-03-13
2025-11-14 17:56:05,084 - INFO - Finished converting document 4_2025-03-13 in 0.05 sec.
2025-11-14 17:56:05,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2025-03-07' --> 'data\processed_data\WMT\4_2025-03-07.md'
Converted 'data\edgar_documents\WMT\4_2025-03-10' --> 'data\processed_data\WMT\4_2025-03-10.md'
Converted 'data\edgar_documents\WMT\4_2025-03-13' --> 'data\processed_data\WMT\4_2025-03-13.md'


2025-11-14 17:56:05,138 - INFO - Going to convert document batch...
2025-11-14 17:56:05,140 - INFO - Processing document 4_2025-03-14
2025-11-14 17:56:05,169 - INFO - Finished converting document 4_2025-03-14 in 0.06 sec.
2025-11-14 17:56:05,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,248 - INFO - Going to convert document batch...
2025-11-14 17:56:05,250 - INFO - Processing document 4_2025-03-18
2025-11-14 17:56:05,301 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.
2025-11-14 17:56:05,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,367 - INFO - Going to convert document batch...
2025-11-14 17:56:05,368 - INFO - Processing document 4_2025-03-20
2025-11-14 17:56:05,393 - INFO - Finished converting document 4_2025-03-20 in 0.05 sec.


Converted 'data\edgar_documents\WMT\4_2025-03-14' --> 'data\processed_data\WMT\4_2025-03-14.md'
Converted 'data\edgar_documents\WMT\4_2025-03-18' --> 'data\processed_data\WMT\4_2025-03-18.md'


2025-11-14 17:56:05,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,441 - INFO - Going to convert document batch...
2025-11-14 17:56:05,442 - INFO - Processing document 4_2025-03-24
2025-11-14 17:56:05,467 - INFO - Finished converting document 4_2025-03-24 in 0.05 sec.
2025-11-14 17:56:05,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,516 - INFO - Going to convert document batch...
2025-11-14 17:56:05,517 - INFO - Processing document 4_2025-03-28
2025-11-14 17:56:05,540 - INFO - Finished converting document 4_2025-03-28 in 0.05 sec.
2025-11-14 17:56:05,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,592 - INFO - Going to convert document batch...
2025-11-14 17:56:05,593 - INFO - Processing document 4_2025-03-31


Converted 'data\edgar_documents\WMT\4_2025-03-20' --> 'data\processed_data\WMT\4_2025-03-20.md'
Converted 'data\edgar_documents\WMT\4_2025-03-24' --> 'data\processed_data\WMT\4_2025-03-24.md'
Converted 'data\edgar_documents\WMT\4_2025-03-28' --> 'data\processed_data\WMT\4_2025-03-28.md'


2025-11-14 17:56:05,618 - INFO - Finished converting document 4_2025-03-31 in 0.05 sec.
2025-11-14 17:56:05,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,663 - INFO - Going to convert document batch...
2025-11-14 17:56:05,664 - INFO - Processing document 4_2025-04-01
2025-11-14 17:56:05,685 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 17:56:05,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,733 - INFO - Going to convert document batch...
2025-11-14 17:56:05,734 - INFO - Processing document 4_2025-04-03
2025-11-14 17:56:05,755 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 17:56:05,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,798 - INFO - Going to convert document batch...
2025-11-14 17:56:05,799 - INFO - Processing document 4_2025-04-10
2025-11-14 17:56:05,817 - INFO - Finished converting document 4_2025-04-10 in 0.03 sec.


Converted 'data\edgar_documents\WMT\4_2025-03-31' --> 'data\processed_data\WMT\4_2025-03-31.md'
Converted 'data\edgar_documents\WMT\4_2025-04-01' --> 'data\processed_data\WMT\4_2025-04-01.md'
Converted 'data\edgar_documents\WMT\4_2025-04-03' --> 'data\processed_data\WMT\4_2025-04-03.md'


2025-11-14 17:56:05,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,859 - INFO - Going to convert document batch...
2025-11-14 17:56:05,859 - INFO - Processing document 4_2025-04-17
2025-11-14 17:56:05,878 - INFO - Finished converting document 4_2025-04-17 in 0.03 sec.
2025-11-14 17:56:05,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:05,930 - INFO - Going to convert document batch...
2025-11-14 17:56:05,931 - INFO - Processing document 4_2025-04-23
2025-11-14 17:56:05,949 - INFO - Finished converting document 4_2025-04-23 in 0.06 sec.
2025-11-14 17:56:06,019 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:56:06,020 - ERROR - Input document 4_2025-04-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\WMT\4_2025-04-10' --> 'data\processed_data\WMT\4_2025-04-10.md'
Converted 'data\edgar_documents\WMT\4_2025-04-17' --> 'data\processed_data\WMT\4_2025-04-17.md'
Converted 'data\edgar_documents\WMT\4_2025-04-23' --> 'data\processed_data\WMT\4_2025-04-23.md'
Error processing data\edgar_documents\WMT\4_2025-04-25: File format not allowed: data\edgar_documents\WMT\4_2025-04-25


2025-11-14 17:56:06,057 - INFO - Going to convert document batch...
2025-11-14 17:56:06,059 - INFO - Processing document 4_2025-04-28
2025-11-14 17:56:06,103 - INFO - Finished converting document 4_2025-04-28 in 0.08 sec.
2025-11-14 17:56:06,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,169 - INFO - Going to convert document batch...
2025-11-14 17:56:06,170 - INFO - Processing document 4_2025-05-05
2025-11-14 17:56:06,196 - INFO - Finished converting document 4_2025-05-05 in 0.05 sec.
2025-11-14 17:56:06,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,267 - INFO - Going to convert document batch...
2025-11-14 17:56:06,268 - INFO - Processing document 4_2025-05-08
2025-11-14 17:56:06,293 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.
2025-11-14 17:56:06,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2025-04-28' --> 'data\processed_data\WMT\4_2025-04-28.md'
Converted 'data\edgar_documents\WMT\4_2025-05-05' --> 'data\processed_data\WMT\4_2025-05-05.md'
Converted 'data\edgar_documents\WMT\4_2025-05-08' --> 'data\processed_data\WMT\4_2025-05-08.md'


2025-11-14 17:56:06,342 - INFO - Going to convert document batch...
2025-11-14 17:56:06,343 - INFO - Processing document 4_2025-05-19
2025-11-14 17:56:06,365 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 17:56:06,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,419 - INFO - Going to convert document batch...
2025-11-14 17:56:06,420 - INFO - Processing document 4_2025-05-20
2025-11-14 17:56:06,477 - INFO - Finished converting document 4_2025-05-20 in 0.08 sec.
2025-11-14 17:56:06,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,535 - INFO - Going to convert document batch...
2025-11-14 17:56:06,536 - INFO - Processing document 4_2025-05-21
2025-11-14 17:56:06,560 - INFO - Finished converting document 4_2025-05-21 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2025-05-19' --> 'data\processed_data\WMT\4_2025-05-19.md'
Converted 'data\edgar_documents\WMT\4_2025-05-20' --> 'data\processed_data\WMT\4_2025-05-20.md'


2025-11-14 17:56:06,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,610 - INFO - Going to convert document batch...
2025-11-14 17:56:06,611 - INFO - Processing document 4_2025-05-23
2025-11-14 17:56:06,637 - INFO - Finished converting document 4_2025-05-23 in 0.06 sec.
2025-11-14 17:56:06,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,681 - INFO - Going to convert document batch...
2025-11-14 17:56:06,682 - INFO - Processing document 4_2025-05-29
2025-11-14 17:56:06,703 - INFO - Finished converting document 4_2025-05-29 in 0.05 sec.
2025-11-14 17:56:06,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,769 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WMT\4_2025-05-21' --> 'data\processed_data\WMT\4_2025-05-21.md'
Converted 'data\edgar_documents\WMT\4_2025-05-23' --> 'data\processed_data\WMT\4_2025-05-23.md'
Converted 'data\edgar_documents\WMT\4_2025-05-29' --> 'data\processed_data\WMT\4_2025-05-29.md'


2025-11-14 17:56:06,770 - INFO - Processing document 4_2025-06-04
2025-11-14 17:56:06,793 - INFO - Finished converting document 4_2025-06-04 in 0.08 sec.
2025-11-14 17:56:06,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,839 - INFO - Going to convert document batch...
2025-11-14 17:56:06,840 - INFO - Processing document 4_2025-06-09
2025-11-14 17:56:06,859 - INFO - Finished converting document 4_2025-06-09 in 0.05 sec.
2025-11-14 17:56:06,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,903 - INFO - Going to convert document batch...
2025-11-14 17:56:06,904 - INFO - Processing document 4_2025-06-17
2025-11-14 17:56:06,922 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 17:56:06,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:06,965 - INFO - Going to convert document batch...
2025-11-14 17:56:06,966 - INFO - Processing document 4_2025-06-23
2025-11-14 17:56:06,985 - IN

Converted 'data\edgar_documents\WMT\4_2025-06-04' --> 'data\processed_data\WMT\4_2025-06-04.md'
Converted 'data\edgar_documents\WMT\4_2025-06-09' --> 'data\processed_data\WMT\4_2025-06-09.md'
Converted 'data\edgar_documents\WMT\4_2025-06-17' --> 'data\processed_data\WMT\4_2025-06-17.md'


2025-11-14 17:56:07,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,031 - INFO - Going to convert document batch...
2025-11-14 17:56:07,031 - INFO - Processing document 4_2025-06-26
2025-11-14 17:56:07,053 - INFO - Finished converting document 4_2025-06-26 in 0.05 sec.
2025-11-14 17:56:07,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,096 - INFO - Going to convert document batch...
2025-11-14 17:56:07,096 - INFO - Processing document 4_2025-06-27
2025-11-14 17:56:07,116 - INFO - Finished converting document 4_2025-06-27 in 0.03 sec.
2025-11-14 17:56:07,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,175 - INFO - Going to convert document batch...
2025-11-14 17:56:07,177 - INFO - Processing document 4_2025-07-01


Converted 'data\edgar_documents\WMT\4_2025-06-23' --> 'data\processed_data\WMT\4_2025-06-23.md'
Converted 'data\edgar_documents\WMT\4_2025-06-26' --> 'data\processed_data\WMT\4_2025-06-26.md'
Converted 'data\edgar_documents\WMT\4_2025-06-27' --> 'data\processed_data\WMT\4_2025-06-27.md'


2025-11-14 17:56:07,205 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.
2025-11-14 17:56:07,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,256 - INFO - Going to convert document batch...
2025-11-14 17:56:07,257 - INFO - Processing document 4_2025-07-02
2025-11-14 17:56:07,281 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 17:56:07,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,330 - INFO - Going to convert document batch...
2025-11-14 17:56:07,331 - INFO - Processing document 4_2025-07-17
2025-11-14 17:56:07,355 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 17:56:07,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,409 - INFO - Going to convert document batch...
2025-11-14 17:56:07,409 - INFO - Processing document 4_2025-07-21


Converted 'data\edgar_documents\WMT\4_2025-07-01' --> 'data\processed_data\WMT\4_2025-07-01.md'
Converted 'data\edgar_documents\WMT\4_2025-07-02' --> 'data\processed_data\WMT\4_2025-07-02.md'
Converted 'data\edgar_documents\WMT\4_2025-07-17' --> 'data\processed_data\WMT\4_2025-07-17.md'


2025-11-14 17:56:07,435 - INFO - Finished converting document 4_2025-07-21 in 0.06 sec.
2025-11-14 17:56:07,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,489 - INFO - Going to convert document batch...
2025-11-14 17:56:07,490 - INFO - Processing document 4_2025-07-22
2025-11-14 17:56:07,514 - INFO - Finished converting document 4_2025-07-22 in 0.05 sec.
2025-11-14 17:56:07,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,560 - INFO - Going to convert document batch...
2025-11-14 17:56:07,561 - INFO - Processing document 4_2025-07-28


Converted 'data\edgar_documents\WMT\4_2025-07-21' --> 'data\processed_data\WMT\4_2025-07-21.md'
Converted 'data\edgar_documents\WMT\4_2025-07-22' --> 'data\processed_data\WMT\4_2025-07-22.md'


2025-11-14 17:56:07,827 - INFO - Finished converting document 4_2025-07-28 in 0.30 sec.
2025-11-14 17:56:07,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,877 - INFO - Going to convert document batch...
2025-11-14 17:56:07,877 - INFO - Processing document 4_2025-08-04
2025-11-14 17:56:07,899 - INFO - Finished converting document 4_2025-08-04 in 0.05 sec.
2025-11-14 17:56:07,950 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:07,959 - INFO - Going to convert document batch...
2025-11-14 17:56:07,959 - INFO - Processing document 4_2025-08-14
2025-11-14 17:56:07,977 - INFO - Finished converting document 4_2025-08-14 in 0.05 sec.
2025-11-14 17:56:08,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,020 - INFO - Going to convert document batch...
2025-11-14 17:56:08,021 - INFO - Processing document 4_2025-08-19
2025-11-14 17:56:08,039 - INFO - Finished converting document 4_2025-08-19 in 0.03 sec.


Converted 'data\edgar_documents\WMT\4_2025-07-28' --> 'data\processed_data\WMT\4_2025-07-28.md'
Converted 'data\edgar_documents\WMT\4_2025-08-04' --> 'data\processed_data\WMT\4_2025-08-04.md'
Converted 'data\edgar_documents\WMT\4_2025-08-14' --> 'data\processed_data\WMT\4_2025-08-14.md'


2025-11-14 17:56:08,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,079 - INFO - Going to convert document batch...
2025-11-14 17:56:08,080 - INFO - Processing document 4_2025-08-20
2025-11-14 17:56:08,101 - INFO - Finished converting document 4_2025-08-20 in 0.03 sec.
2025-11-14 17:56:08,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,153 - INFO - Going to convert document batch...
2025-11-14 17:56:08,154 - INFO - Processing document 4_2025-08-21
2025-11-14 17:56:08,182 - INFO - Finished converting document 4_2025-08-21 in 0.06 sec.
2025-11-14 17:56:08,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,240 - INFO - Going to convert document batch...
2025-11-14 17:56:08,240 - INFO - Processing document 4_2025-08-25


Converted 'data\edgar_documents\WMT\4_2025-08-19' --> 'data\processed_data\WMT\4_2025-08-19.md'
Converted 'data\edgar_documents\WMT\4_2025-08-20' --> 'data\processed_data\WMT\4_2025-08-20.md'
Converted 'data\edgar_documents\WMT\4_2025-08-21' --> 'data\processed_data\WMT\4_2025-08-21.md'


2025-11-14 17:56:08,264 - INFO - Finished converting document 4_2025-08-25 in 0.06 sec.
2025-11-14 17:56:08,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,316 - INFO - Going to convert document batch...
2025-11-14 17:56:08,317 - INFO - Processing document 4_2025-08-26
2025-11-14 17:56:08,354 - INFO - Finished converting document 4_2025-08-26 in 0.08 sec.
2025-11-14 17:56:08,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,450 - INFO - Going to convert document batch...
2025-11-14 17:56:08,451 - INFO - Processing document 4_2025-08-29


Converted 'data\edgar_documents\WMT\4_2025-08-25' --> 'data\processed_data\WMT\4_2025-08-25.md'
Converted 'data\edgar_documents\WMT\4_2025-08-26' --> 'data\processed_data\WMT\4_2025-08-26.md'


2025-11-14 17:56:08,484 - INFO - Finished converting document 4_2025-08-29 in 0.08 sec.
2025-11-14 17:56:08,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,547 - INFO - Going to convert document batch...
2025-11-14 17:56:08,548 - INFO - Processing document 4_2025-09-02
2025-11-14 17:56:08,579 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 17:56:08,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,630 - INFO - Going to convert document batch...
2025-11-14 17:56:08,630 - INFO - Processing document 4_2025-09-03
2025-11-14 17:56:08,654 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 17:56:08,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,699 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WMT\4_2025-08-29' --> 'data\processed_data\WMT\4_2025-08-29.md'
Converted 'data\edgar_documents\WMT\4_2025-09-02' --> 'data\processed_data\WMT\4_2025-09-02.md'
Converted 'data\edgar_documents\WMT\4_2025-09-03' --> 'data\processed_data\WMT\4_2025-09-03.md'


2025-11-14 17:56:08,700 - INFO - Processing document 4_2025-09-10
2025-11-14 17:56:08,719 - INFO - Finished converting document 4_2025-09-10 in 0.05 sec.
2025-11-14 17:56:08,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,762 - INFO - Going to convert document batch...
2025-11-14 17:56:08,762 - INFO - Processing document 4_2025-09-11
2025-11-14 17:56:08,783 - INFO - Finished converting document 4_2025-09-11 in 0.05 sec.
2025-11-14 17:56:08,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:08,863 - INFO - Going to convert document batch...
2025-11-14 17:56:08,863 - INFO - Processing document 4_2025-09-16
2025-11-14 17:56:08,885 - INFO - Finished converting document 4_2025-09-16 in 0.05 sec.
2025-11-14 17:56:08,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2025-09-10' --> 'data\processed_data\WMT\4_2025-09-10.md'
Converted 'data\edgar_documents\WMT\4_2025-09-11' --> 'data\processed_data\WMT\4_2025-09-11.md'
Converted 'data\edgar_documents\WMT\4_2025-09-16' --> 'data\processed_data\WMT\4_2025-09-16.md'


2025-11-14 17:56:08,931 - INFO - Going to convert document batch...
2025-11-14 17:56:08,933 - INFO - Processing document 4_2025-09-17
2025-11-14 17:56:08,955 - INFO - Finished converting document 4_2025-09-17 in 0.05 sec.
2025-11-14 17:56:08,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,001 - INFO - Going to convert document batch...
2025-11-14 17:56:09,002 - INFO - Processing document 4_2025-09-22
2025-11-14 17:56:09,024 - INFO - Finished converting document 4_2025-09-22 in 0.05 sec.
2025-11-14 17:56:09,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,074 - INFO - Going to convert document batch...
2025-11-14 17:56:09,074 - INFO - Processing document 4_2025-09-24
2025-11-14 17:56:09,096 - INFO - Finished converting document 4_2025-09-24 in 0.05 sec.
2025-11-14 17:56:09,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2025-09-17' --> 'data\processed_data\WMT\4_2025-09-17.md'
Converted 'data\edgar_documents\WMT\4_2025-09-22' --> 'data\processed_data\WMT\4_2025-09-22.md'
Converted 'data\edgar_documents\WMT\4_2025-09-24' --> 'data\processed_data\WMT\4_2025-09-24.md'


2025-11-14 17:56:09,164 - INFO - Going to convert document batch...
2025-11-14 17:56:09,166 - INFO - Processing document 4_2025-09-26
2025-11-14 17:56:09,190 - INFO - Finished converting document 4_2025-09-26 in 0.06 sec.
2025-11-14 17:56:09,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,249 - INFO - Going to convert document batch...
2025-11-14 17:56:09,252 - INFO - Processing document 4_2025-10-02
2025-11-14 17:56:09,287 - INFO - Finished converting document 4_2025-10-02 in 0.06 sec.
2025-11-14 17:56:09,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,355 - INFO - Going to convert document batch...
2025-11-14 17:56:09,356 - INFO - Processing document 4_2025-10-09
2025-11-14 17:56:09,379 - INFO - Finished converting document 4_2025-10-09 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2025-09-26' --> 'data\processed_data\WMT\4_2025-09-26.md'
Converted 'data\edgar_documents\WMT\4_2025-10-02' --> 'data\processed_data\WMT\4_2025-10-02.md'


2025-11-14 17:56:09,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,427 - INFO - Going to convert document batch...
2025-11-14 17:56:09,428 - INFO - Processing document 4_2025-10-17
2025-11-14 17:56:09,455 - INFO - Finished converting document 4_2025-10-17 in 0.05 sec.
2025-11-14 17:56:09,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,511 - INFO - Going to convert document batch...
2025-11-14 17:56:09,511 - INFO - Processing document 4_2025-10-22
2025-11-14 17:56:09,533 - INFO - Finished converting document 4_2025-10-22 in 0.05 sec.
2025-11-14 17:56:09,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,581 - INFO - Going to convert document batch...
2025-11-14 17:56:09,581 - INFO - Processing document 4_2025-10-24
2025-11-14 17:56:09,607 - INFO - Finished converting document 4_2025-10-24 in 0.06 sec.


Converted 'data\edgar_documents\WMT\4_2025-10-09' --> 'data\processed_data\WMT\4_2025-10-09.md'
Converted 'data\edgar_documents\WMT\4_2025-10-17' --> 'data\processed_data\WMT\4_2025-10-17.md'
Converted 'data\edgar_documents\WMT\4_2025-10-22' --> 'data\processed_data\WMT\4_2025-10-22.md'


2025-11-14 17:56:09,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,651 - INFO - Going to convert document batch...
2025-11-14 17:56:09,653 - INFO - Processing document 4_2025-11-04
2025-11-14 17:56:09,674 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 17:56:09,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,744 - INFO - Going to convert document batch...
2025-11-14 17:56:09,745 - INFO - Processing document 4_2025-11-06
2025-11-14 17:56:09,771 - INFO - Finished converting document 4_2025-11-06 in 0.06 sec.
2025-11-14 17:56:09,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\4_2025-10-24' --> 'data\processed_data\WMT\4_2025-10-24.md'
Converted 'data\edgar_documents\WMT\4_2025-11-04' --> 'data\processed_data\WMT\4_2025-11-04.md'
Converted 'data\edgar_documents\WMT\4_2025-11-06' --> 'data\processed_data\WMT\4_2025-11-06.md'


2025-11-14 17:56:09,844 - INFO - Going to convert document batch...
2025-11-14 17:56:09,845 - INFO - Processing document 8-K_2023-02-21
2025-11-14 17:56:09,866 - INFO - Finished converting document 8-K_2023-02-21 in 0.06 sec.
2025-11-14 17:56:09,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,908 - INFO - Going to convert document batch...
2025-11-14 17:56:09,909 - INFO - Processing document 8-K_2023-02-24
2025-11-14 17:56:09,939 - INFO - Finished converting document 8-K_2023-02-24 in 0.06 sec.
2025-11-14 17:56:09,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:09,991 - INFO - Going to convert document batch...
2025-11-14 17:56:09,992 - INFO - Processing document 8-K_2023-03-06
2025-11-14 17:56:10,009 - INFO - Finished converting document 8-K_2023-03-06 in 0.05 sec.
2025-11-14 17:56:10,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,048 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\WMT\8-K_2023-02-21' --> 'data\processed_data\WMT\8-K_2023-02-21.md'
Converted 'data\edgar_documents\WMT\8-K_2023-02-24' --> 'data\processed_data\WMT\8-K_2023-02-24.md'
Converted 'data\edgar_documents\WMT\8-K_2023-03-06' --> 'data\processed_data\WMT\8-K_2023-03-06.md'


2025-11-14 17:56:10,067 - INFO - Finished converting document 8-K_2023-03-24 in 0.05 sec.
2025-11-14 17:56:10,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,107 - INFO - Going to convert document batch...
2025-11-14 17:56:10,109 - INFO - Processing document 8-K_2023-04-04
2025-11-14 17:56:10,125 - INFO - Finished converting document 8-K_2023-04-04 in 0.05 sec.
2025-11-14 17:56:10,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,168 - INFO - Going to convert document batch...
2025-11-14 17:56:10,169 - INFO - Processing document 8-K_2023-04-17
2025-11-14 17:56:10,200 - INFO - Finished converting document 8-K_2023-04-17 in 0.06 sec.
2025-11-14 17:56:10,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,245 - INFO - Going to convert document batch...
2025-11-14 17:56:10,245 - INFO - Processing document 8-K_2023-05-18
2025-11-14 17:56:10,261 - INFO - Finished converting document 8-K_2023-05-18 in 0.

Converted 'data\edgar_documents\WMT\8-K_2023-03-24' --> 'data\processed_data\WMT\8-K_2023-03-24.md'
Converted 'data\edgar_documents\WMT\8-K_2023-04-04' --> 'data\processed_data\WMT\8-K_2023-04-04.md'
Converted 'data\edgar_documents\WMT\8-K_2023-04-17' --> 'data\processed_data\WMT\8-K_2023-04-17.md'


2025-11-14 17:56:10,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,316 - INFO - Going to convert document batch...
2025-11-14 17:56:10,317 - INFO - Processing document 8-K_2023-06-02
2025-11-14 17:56:10,371 - INFO - Finished converting document 8-K_2023-06-02 in 0.11 sec.
2025-11-14 17:56:10,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,427 - INFO - Going to convert document batch...
2025-11-14 17:56:10,428 - INFO - Processing document 8-K_2023-08-16
2025-11-14 17:56:10,444 - INFO - Finished converting document 8-K_2023-08-16 in 0.03 sec.


Converted 'data\edgar_documents\WMT\8-K_2023-05-18' --> 'data\processed_data\WMT\8-K_2023-05-18.md'
Converted 'data\edgar_documents\WMT\8-K_2023-06-02' --> 'data\processed_data\WMT\8-K_2023-06-02.md'


2025-11-14 17:56:10,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,480 - INFO - Going to convert document batch...
2025-11-14 17:56:10,480 - INFO - Processing document 8-K_2023-08-17
2025-11-14 17:56:10,496 - INFO - Finished converting document 8-K_2023-08-17 in 0.05 sec.
2025-11-14 17:56:10,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,540 - INFO - Going to convert document batch...
2025-11-14 17:56:10,541 - INFO - Processing document 8-K_2023-08-22
2025-11-14 17:56:10,567 - INFO - Finished converting document 8-K_2023-08-22 in 0.06 sec.
2025-11-14 17:56:10,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,615 - INFO - Going to convert document batch...
2025-11-14 17:56:10,615 - INFO - Processing document 8-K_2023-11-16
2025-11-14 17:56:10,637 - INFO - Finished converting document 8-K_2023-11-16 in 0.06 sec.


Converted 'data\edgar_documents\WMT\8-K_2023-08-16' --> 'data\processed_data\WMT\8-K_2023-08-16.md'
Converted 'data\edgar_documents\WMT\8-K_2023-08-17' --> 'data\processed_data\WMT\8-K_2023-08-17.md'
Converted 'data\edgar_documents\WMT\8-K_2023-08-22' --> 'data\processed_data\WMT\8-K_2023-08-22.md'


2025-11-14 17:56:10,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,680 - INFO - Going to convert document batch...
2025-11-14 17:56:10,680 - INFO - Processing document 8-K_2024-01-31
2025-11-14 17:56:10,701 - INFO - Finished converting document 8-K_2024-01-31 in 0.06 sec.
2025-11-14 17:56:10,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,743 - INFO - Going to convert document batch...
2025-11-14 17:56:10,743 - INFO - Processing document 8-K_2024-02-20
2025-11-14 17:56:10,764 - INFO - Finished converting document 8-K_2024-02-20 in 0.05 sec.
2025-11-14 17:56:10,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,805 - INFO - Going to convert document batch...
2025-11-14 17:56:10,806 - INFO - Processing document 8-K_2024-02-23
2025-11-14 17:56:10,824 - INFO - Finished converting document 8-K_2024-02-23 in 0.06 sec.


Converted 'data\edgar_documents\WMT\8-K_2023-11-16' --> 'data\processed_data\WMT\8-K_2023-11-16.md'
Converted 'data\edgar_documents\WMT\8-K_2024-01-31' --> 'data\processed_data\WMT\8-K_2024-01-31.md'
Converted 'data\edgar_documents\WMT\8-K_2024-02-20' --> 'data\processed_data\WMT\8-K_2024-02-20.md'


2025-11-14 17:56:10,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,864 - INFO - Going to convert document batch...
2025-11-14 17:56:10,865 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:56:10,886 - INFO - Finished converting document 8-K_2024-02-28 in 0.06 sec.
2025-11-14 17:56:10,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:10,931 - INFO - Going to convert document batch...
2025-11-14 17:56:10,932 - INFO - Processing document 8-K_2024-03-28
2025-11-14 17:56:10,968 - INFO - Finished converting document 8-K_2024-03-28 in 0.08 sec.
2025-11-14 17:56:11,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,020 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WMT\8-K_2024-02-23' --> 'data\processed_data\WMT\8-K_2024-02-23.md'
Converted 'data\edgar_documents\WMT\8-K_2024-02-28' --> 'data\processed_data\WMT\8-K_2024-02-28.md'
Converted 'data\edgar_documents\WMT\8-K_2024-03-28' --> 'data\processed_data\WMT\8-K_2024-03-28.md'


2025-11-14 17:56:11,021 - INFO - Processing document 8-K_2024-05-16
2025-11-14 17:56:11,046 - INFO - Finished converting document 8-K_2024-05-16 in 0.06 sec.
2025-11-14 17:56:11,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,109 - INFO - Going to convert document batch...
2025-11-14 17:56:11,110 - INFO - Processing document 8-K_2024-06-07
2025-11-14 17:56:11,164 - INFO - Finished converting document 8-K_2024-06-07 in 0.09 sec.
2025-11-14 17:56:11,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,217 - INFO - Going to convert document batch...
2025-11-14 17:56:11,218 - INFO - Processing document 8-K_2024-08-15
2025-11-14 17:56:11,236 - INFO - Finished converting document 8-K_2024-08-15 in 0.05 sec.


Converted 'data\edgar_documents\WMT\8-K_2024-05-16' --> 'data\processed_data\WMT\8-K_2024-05-16.md'
Converted 'data\edgar_documents\WMT\8-K_2024-06-07' --> 'data\processed_data\WMT\8-K_2024-06-07.md'


2025-11-14 17:56:11,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,271 - INFO - Going to convert document batch...
2025-11-14 17:56:11,272 - INFO - Processing document 8-K_2024-09-06
2025-11-14 17:56:11,289 - INFO - Finished converting document 8-K_2024-09-06 in 0.03 sec.
2025-11-14 17:56:11,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,328 - INFO - Going to convert document batch...
2025-11-14 17:56:11,329 - INFO - Processing document 8-K_2024-10-18
2025-11-14 17:56:11,353 - INFO - Finished converting document 8-K_2024-10-18 in 0.05 sec.
2025-11-14 17:56:11,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,404 - INFO - Going to convert document batch...
2025-11-14 17:56:11,405 - INFO - Processing document 8-K_2024-11-19
2025-11-14 17:56:11,435 - INFO - Finished converting document 8-K_2024-11-19 in 0.06 sec.


Converted 'data\edgar_documents\WMT\8-K_2024-08-15' --> 'data\processed_data\WMT\8-K_2024-08-15.md'
Converted 'data\edgar_documents\WMT\8-K_2024-09-06' --> 'data\processed_data\WMT\8-K_2024-09-06.md'
Converted 'data\edgar_documents\WMT\8-K_2024-10-18' --> 'data\processed_data\WMT\8-K_2024-10-18.md'


2025-11-14 17:56:11,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,474 - INFO - Going to convert document batch...
2025-11-14 17:56:11,475 - INFO - Processing document 8-K_2024-11-22
2025-11-14 17:56:11,494 - INFO - Finished converting document 8-K_2024-11-22 in 0.05 sec.
2025-11-14 17:56:11,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,536 - INFO - Going to convert document batch...
2025-11-14 17:56:11,537 - INFO - Processing document 8-K_2025-02-20
2025-11-14 17:56:11,573 - INFO - Finished converting document 8-K_2025-02-20 in 0.08 sec.
2025-11-14 17:56:11,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,622 - INFO - Going to convert document batch...
2025-11-14 17:56:11,623 - INFO - Processing document 8-K_2025-03-17


Converted 'data\edgar_documents\WMT\8-K_2024-11-19' --> 'data\processed_data\WMT\8-K_2024-11-19.md'
Converted 'data\edgar_documents\WMT\8-K_2024-11-22' --> 'data\processed_data\WMT\8-K_2024-11-22.md'
Converted 'data\edgar_documents\WMT\8-K_2025-02-20' --> 'data\processed_data\WMT\8-K_2025-02-20.md'


2025-11-14 17:56:11,643 - INFO - Finished converting document 8-K_2025-03-17 in 0.05 sec.
2025-11-14 17:56:11,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,685 - INFO - Going to convert document batch...
2025-11-14 17:56:11,686 - INFO - Processing document 8-K_2025-04-09
2025-11-14 17:56:11,706 - INFO - Finished converting document 8-K_2025-04-09 in 0.05 sec.
2025-11-14 17:56:11,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,753 - INFO - Going to convert document batch...
2025-11-14 17:56:11,753 - INFO - Processing document 8-K_2025-04-28
2025-11-14 17:56:11,784 - INFO - Finished converting document 8-K_2025-04-28 in 0.06 sec.
2025-11-14 17:56:11,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,829 - INFO - Going to convert document batch...
2025-11-14 17:56:11,829 - INFO - Processing document 8-K_2025-05-15
2025-11-14 17:56:11,848 - INFO - Finished converting document 8-K_2025-05-15 in 0.

Converted 'data\edgar_documents\WMT\8-K_2025-03-17' --> 'data\processed_data\WMT\8-K_2025-03-17.md'
Converted 'data\edgar_documents\WMT\8-K_2025-04-09' --> 'data\processed_data\WMT\8-K_2025-04-09.md'
Converted 'data\edgar_documents\WMT\8-K_2025-04-28' --> 'data\processed_data\WMT\8-K_2025-04-28.md'


2025-11-14 17:56:11,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,894 - INFO - Going to convert document batch...
2025-11-14 17:56:11,896 - INFO - Processing document 8-K_2025-06-06
2025-11-14 17:56:11,944 - INFO - Finished converting document 8-K_2025-06-06 in 0.08 sec.
2025-11-14 17:56:11,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:11,996 - INFO - Going to convert document batch...
2025-11-14 17:56:11,996 - INFO - Processing document 8-K_2025-08-21
2025-11-14 17:56:12,015 - INFO - Finished converting document 8-K_2025-08-21 in 0.05 sec.
2025-11-14 17:56:12,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:12,050 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\WMT\8-K_2025-05-15' --> 'data\processed_data\WMT\8-K_2025-05-15.md'
Converted 'data\edgar_documents\WMT\8-K_2025-06-06' --> 'data\processed_data\WMT\8-K_2025-06-06.md'
Converted 'data\edgar_documents\WMT\8-K_2025-08-21' --> 'data\processed_data\WMT\8-K_2025-08-21.md'


2025-11-14 17:56:12,051 - INFO - Processing document 8-K_2025-09-05
2025-11-14 17:56:12,066 - INFO - Finished converting document 8-K_2025-09-05 in 0.03 sec.
2025-11-14 17:56:12,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:12,097 - INFO - Going to convert document batch...
2025-11-14 17:56:12,098 - INFO - Processing document 8-K_2025-09-19
2025-11-14 17:56:12,115 - INFO - Finished converting document 8-K_2025-09-19 in 0.03 sec.
2025-11-14 17:56:12,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:12,145 - INFO - Going to convert document batch...
2025-11-14 17:56:12,146 - INFO - Processing document 8-K_2025-09-22
2025-11-14 17:56:12,174 - INFO - Finished converting document 8-K_2025-09-22 in 0.05 sec.
2025-11-14 17:56:12,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:56:12,234 - INFO - Going to convert document batch...
2025-11-14 17:56:12,235 - INFO - Processing document 8-K_2025-10-22
2025-11-14 17:

Converted 'data\edgar_documents\WMT\8-K_2025-09-05' --> 'data\processed_data\WMT\8-K_2025-09-05.md'
Converted 'data\edgar_documents\WMT\8-K_2025-09-19' --> 'data\processed_data\WMT\8-K_2025-09-19.md'
Converted 'data\edgar_documents\WMT\8-K_2025-09-22' --> 'data\processed_data\WMT\8-K_2025-09-22.md'


2025-11-14 17:56:12,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\8-K_2025-10-22' --> 'data\processed_data\WMT\8-K_2025-10-22.md'


2025-11-14 17:56:13,029 - INFO - Going to convert document batch...
2025-11-14 17:56:13,030 - INFO - Processing document DEF-14A_2023-04-20
2025-11-14 17:56:17,385 - INFO - Finished converting document DEF-14A_2023-04-20 in 5.11 sec.
2025-11-14 17:56:18,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\DEF-14A_2023-04-20' --> 'data\processed_data\WMT\DEF-14A_2023-04-20.md'


2025-11-14 17:56:19,275 - INFO - Going to convert document batch...
2025-11-14 17:56:19,275 - INFO - Processing document DEF-14A_2024-04-25
2025-11-14 17:56:23,675 - INFO - Finished converting document DEF-14A_2024-04-25 in 4.98 sec.
2025-11-14 17:56:25,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\DEF-14A_2024-04-25' --> 'data\processed_data\WMT\DEF-14A_2024-04-25.md'


2025-11-14 17:56:25,923 - INFO - Going to convert document batch...
2025-11-14 17:56:25,924 - INFO - Processing document DEF-14A_2025-04-24
2025-11-14 17:56:31,489 - INFO - Finished converting document DEF-14A_2025-04-24 in 6.17 sec.
2025-11-14 17:56:33,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\WMT\DEF-14A_2025-04-24' --> 'data\processed_data\WMT\DEF-14A_2025-04-24.md'
Processed 251 new files. Errors: 3
Found 120 files to process in data\edgar_documents\XOM


2025-11-14 17:56:35,437 - INFO - Going to convert document batch...
2025-11-14 17:56:35,438 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 17:56:35,439 - INFO - Processing document 10-K_2023-02-22
2025-11-14 17:56:38,719 - INFO - Finished converting document 10-K_2023-02-22 in 5.19 sec.
2025-11-14 17:56:40,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-K_2023-02-22' --> 'data\processed_data\XOM\10-K_2023-02-22.md'


2025-11-14 17:56:42,556 - INFO - Going to convert document batch...
2025-11-14 17:56:42,557 - INFO - Processing document 10-K_2024-02-28
2025-11-14 17:56:45,793 - INFO - Finished converting document 10-K_2024-02-28 in 5.02 sec.
2025-11-14 17:56:47,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-K_2024-02-28' --> 'data\processed_data\XOM\10-K_2024-02-28.md'


2025-11-14 17:56:49,811 - INFO - Going to convert document batch...
2025-11-14 17:56:49,812 - INFO - Processing document 10-K_2025-02-19
2025-11-14 17:56:53,789 - INFO - Finished converting document 10-K_2025-02-19 in 6.22 sec.
2025-11-14 17:56:55,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-K_2025-02-19' --> 'data\processed_data\XOM\10-K_2025-02-19.md'


2025-11-14 17:56:56,112 - INFO - Going to convert document batch...
2025-11-14 17:56:56,113 - INFO - Processing document 10-Q_2023-05-02
2025-11-14 17:56:56,672 - INFO - Finished converting document 10-Q_2023-05-02 in 0.98 sec.
2025-11-14 17:56:57,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2023-05-02' --> 'data\processed_data\XOM\10-Q_2023-05-02.md'


2025-11-14 17:56:57,415 - INFO - Going to convert document batch...
2025-11-14 17:56:57,416 - INFO - Processing document 10-Q_2023-08-01
2025-11-14 17:56:58,151 - INFO - Finished converting document 10-Q_2023-08-01 in 1.11 sec.
2025-11-14 17:56:58,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2023-08-01' --> 'data\processed_data\XOM\10-Q_2023-08-01.md'


2025-11-14 17:56:59,689 - INFO - Going to convert document batch...
2025-11-14 17:56:59,690 - INFO - Processing document 10-Q_2023-10-31
2025-11-14 17:57:00,428 - INFO - Finished converting document 10-Q_2023-10-31 in 1.81 sec.
2025-11-14 17:57:00,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2023-10-31' --> 'data\processed_data\XOM\10-Q_2023-10-31.md'


2025-11-14 17:57:01,177 - INFO - Going to convert document batch...
2025-11-14 17:57:01,178 - INFO - Processing document 10-Q_2024-04-29
2025-11-14 17:57:01,791 - INFO - Finished converting document 10-Q_2024-04-29 in 0.89 sec.
2025-11-14 17:57:02,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2024-04-29' --> 'data\processed_data\XOM\10-Q_2024-04-29.md'


2025-11-14 17:57:02,839 - INFO - Going to convert document batch...
2025-11-14 17:57:02,839 - INFO - Processing document 10-Q_2024-08-05
2025-11-14 17:57:03,607 - INFO - Finished converting document 10-Q_2024-08-05 in 1.44 sec.
2025-11-14 17:57:04,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2024-08-05' --> 'data\processed_data\XOM\10-Q_2024-08-05.md'


2025-11-14 17:57:04,469 - INFO - Going to convert document batch...
2025-11-14 17:57:04,470 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 17:57:05,179 - INFO - Finished converting document 10-Q_2024-11-04 in 1.08 sec.
2025-11-14 17:57:05,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2024-11-04' --> 'data\processed_data\XOM\10-Q_2024-11-04.md'


2025-11-14 17:57:06,222 - INFO - Going to convert document batch...
2025-11-14 17:57:06,222 - INFO - Processing document 10-Q_2025-05-05
2025-11-14 17:57:06,884 - INFO - Finished converting document 10-Q_2025-05-05 in 1.27 sec.
2025-11-14 17:57:07,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2025-05-05' --> 'data\processed_data\XOM\10-Q_2025-05-05.md'


2025-11-14 17:57:07,805 - INFO - Going to convert document batch...
2025-11-14 17:57:07,806 - INFO - Processing document 10-Q_2025-08-04
2025-11-14 17:57:08,672 - INFO - Finished converting document 10-Q_2025-08-04 in 1.34 sec.
2025-11-14 17:57:09,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\10-Q_2025-08-04' --> 'data\processed_data\XOM\10-Q_2025-08-04.md'


2025-11-14 17:57:10,101 - INFO - Going to convert document batch...
2025-11-14 17:57:10,102 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 17:57:11,002 - INFO - Finished converting document 10-Q_2025-11-03 in 1.41 sec.
2025-11-14 17:57:11,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:11,655 - INFO - Going to convert document batch...
2025-11-14 17:57:11,657 - INFO - Processing document 4_2023-01-04
2025-11-14 17:57:11,672 - INFO - Finished converting document 4_2023-01-04 in 0.03 sec.
2025-11-14 17:57:11,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:11,734 - INFO - Going to convert document batch...
2025-11-14 17:57:11,735 - INFO - Processing document 4_2023-01-05
2025-11-14 17:57:11,753 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 17:57:11,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:11,789 - INFO - Going to convert document batch...
2025-11-14 17:57:11,

Converted 'data\edgar_documents\XOM\10-Q_2025-11-03' --> 'data\processed_data\XOM\10-Q_2025-11-03.md'
Converted 'data\edgar_documents\XOM\4_2023-01-04' --> 'data\processed_data\XOM\4_2023-01-04.md'
Converted 'data\edgar_documents\XOM\4_2023-01-05' --> 'data\processed_data\XOM\4_2023-01-05.md'
Converted 'data\edgar_documents\XOM\4_2023-02-03' --> 'data\processed_data\XOM\4_2023-02-03.md'


2025-11-14 17:57:11,847 - INFO - Going to convert document batch...
2025-11-14 17:57:11,847 - INFO - Processing document 4_2023-05-03
2025-11-14 17:57:11,866 - INFO - Finished converting document 4_2023-05-03 in 0.03 sec.
2025-11-14 17:57:11,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:11,912 - INFO - Going to convert document batch...
2025-11-14 17:57:11,913 - INFO - Processing document 4_2023-06-01
2025-11-14 17:57:11,931 - INFO - Finished converting document 4_2023-06-01 in 0.03 sec.
2025-11-14 17:57:11,984 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:11,985 - ERROR - Input document 4_2023-07-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\XOM\4_2023-05-03' --> 'data\processed_data\XOM\4_2023-05-03.md'
Converted 'data\edgar_documents\XOM\4_2023-06-01' --> 'data\processed_data\XOM\4_2023-06-01.md'
Error processing data\edgar_documents\XOM\4_2023-07-13: File format not allowed: data\edgar_documents\XOM\4_2023-07-13
Error processing data\edgar_documents\XOM\4_2023-07-24: File format not allowed: data\edgar_documents\XOM\4_2023-07-24
Error processing data\edgar_documents\XOM\4_2023-07-28: File format not allowed: data\edgar_documents\XOM\4_2023-07-28


2025-11-14 17:57:12,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:12,121 - INFO - Going to convert document batch...
2025-11-14 17:57:12,122 - INFO - Processing document 4_2023-08-03
2025-11-14 17:57:12,146 - INFO - Finished converting document 4_2023-08-03 in 0.05 sec.
2025-11-14 17:57:12,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:12,190 - INFO - Going to convert document batch...
2025-11-14 17:57:12,191 - INFO - Processing document 4_2023-09-05
2025-11-14 17:57:12,212 - INFO - Finished converting document 4_2023-09-05 in 0.03 sec.


Converted 'data\edgar_documents\XOM\4_2023-08-02' --> 'data\processed_data\XOM\4_2023-08-02.md'
Converted 'data\edgar_documents\XOM\4_2023-08-03' --> 'data\processed_data\XOM\4_2023-08-03.md'
Converted 'data\edgar_documents\XOM\4_2023-09-05' --> 'data\processed_data\XOM\4_2023-09-05.md'


2025-11-14 17:57:12,324 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:12,325 - ERROR - Input document 4_2023-09-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57:12,327 - INFO - Going to convert document batch...
2025-11-14 17:57:12,341 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:12,342 - ERROR - Input document 4_2023-10-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\XOM\4_2023-09-29: File format not allowed: data\edgar_documents\XOM\4_2023-09-29
Error processing data\edgar_documents\XOM\4_2023-10-11: File format not allowed: data\edgar_documents\XOM\4_2023-10-11
Error processing data\edgar_documents\XOM\4_2023-10-12: File format not allowed: data\edgar_documents\XOM\4_2023-10-12
Error processing data\edgar_documents\XOM\4_2023-10-18: File format not allowed: data\edgar_documents\XOM\4_2023-10-18
Error processing data\edgar_documents\XOM\4_2023-10-20: File format not allowed: data\edgar_documents\XOM\4_2023-10-20
Error processing data\edgar_documents\XOM\4_2023-10-27: File format not allowed: data\edgar_documents\XOM\4_2023-10-27
Error processing data\edgar_documents\XOM\4_2023-10-30: File format not allowed: data\edgar_documents\XOM\4_2023-10-30
Error processing data\edgar_documents\XOM\4_2023-10-31: File format not allowed: data\edgar_documents\XOM\4_2023-10-31


2025-11-14 17:57:12,575 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:12,575 - ERROR - Input document 4_2023-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57:12,576 - INFO - Going to convert document batch...
2025-11-14 17:57:12,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:12,596 - INFO - Going to convert document batch...
2025-11-14 17:57:12,597 - INFO - Processing document 4_2023-11-28
2025-11-14 17:57:12,617 - INFO - Fin

Converted 'data\edgar_documents\XOM\4_2023-11-08' --> 'data\processed_data\XOM\4_2023-11-08.md'
Error processing data\edgar_documents\XOM\4_2023-11-13: File format not allowed: data\edgar_documents\XOM\4_2023-11-13
Converted 'data\edgar_documents\XOM\4_2023-11-28' --> 'data\processed_data\XOM\4_2023-11-28.md'
Converted 'data\edgar_documents\XOM\4_2023-11-30' --> 'data\processed_data\XOM\4_2023-11-30.md'


2025-11-14 17:57:12,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:12,793 - INFO - Going to convert document batch...
2025-11-14 17:57:12,794 - INFO - Processing document 4_2023-12-05
2025-11-14 17:57:12,814 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 17:57:12,848 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:12,849 - ERROR - Input document 4_2023-12-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57

Converted 'data\edgar_documents\XOM\4_2023-12-01' --> 'data\processed_data\XOM\4_2023-12-01.md'
Converted 'data\edgar_documents\XOM\4_2023-12-05' --> 'data\processed_data\XOM\4_2023-12-05.md'
Error processing data\edgar_documents\XOM\4_2023-12-06: File format not allowed: data\edgar_documents\XOM\4_2023-12-06
Error processing data\edgar_documents\XOM\4_2023-12-11: File format not allowed: data\edgar_documents\XOM\4_2023-12-11
Converted 'data\edgar_documents\XOM\4_2023-12-19' --> 'data\processed_data\XOM\4_2023-12-19.md'


2025-11-14 17:57:12,962 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 17:57:12,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,003 - INFO - Going to convert document batch...
2025-11-14 17:57:13,004 - INFO - Processing document 4_2024-01-04
2025-11-14 17:57:13,027 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 17:57:13,082 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:13,082 - ERROR - Input document 4_2024-01-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\XOM\4_2024-01-03' --> 'data\processed_data\XOM\4_2024-01-03.md'
Converted 'data\edgar_documents\XOM\4_2024-01-04' --> 'data\processed_data\XOM\4_2024-01-04.md'
Error processing data\edgar_documents\XOM\4_2024-01-08: File format not allowed: data\edgar_documents\XOM\4_2024-01-08
Error processing data\edgar_documents\XOM\4_2024-02-02: File format not allowed: data\edgar_documents\XOM\4_2024-02-02


2025-11-14 17:57:13,444 - INFO - Going to convert document batch...
2025-11-14 17:57:13,445 - INFO - Processing document 4_2024-02-23
2025-11-14 17:57:13,463 - INFO - Finished converting document 4_2024-02-23 in 0.36 sec.
2025-11-14 17:57:13,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,519 - INFO - Going to convert document batch...
2025-11-14 17:57:13,520 - INFO - Processing document 4_2024-03-19
2025-11-14 17:57:13,538 - INFO - Finished converting document 4_2024-03-19 in 0.05 sec.
2025-11-14 17:57:13,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,577 - INFO - Going to convert document batch...
2025-11-14 17:57:13,578 - INFO - Processing document 4_2024-04-30
2025-11-14 17:57:13,598 - INFO - Finished converting document 4_2024-04-30 in 0.03 sec.
2025-11-14 17:57:13,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,636 - INFO - Going to convert document batch...
2025-11-14 17:57:13,636 - 

Converted 'data\edgar_documents\XOM\4_2024-02-23' --> 'data\processed_data\XOM\4_2024-02-23.md'
Converted 'data\edgar_documents\XOM\4_2024-03-19' --> 'data\processed_data\XOM\4_2024-03-19.md'
Converted 'data\edgar_documents\XOM\4_2024-04-30' --> 'data\processed_data\XOM\4_2024-04-30.md'


2025-11-14 17:57:13,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,692 - INFO - Going to convert document batch...
2025-11-14 17:57:13,693 - INFO - Processing document 4_2024-05-28
2025-11-14 17:57:13,714 - INFO - Finished converting document 4_2024-05-28 in 0.05 sec.
2025-11-14 17:57:13,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,754 - INFO - Going to convert document batch...
2025-11-14 17:57:13,755 - INFO - Processing document 4_2024-05-29
2025-11-14 17:57:13,770 - INFO - Finished converting document 4_2024-05-29 in 0.03 sec.
2025-11-14 17:57:13,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,807 - INFO - Going to convert document batch...
2025-11-14 17:57:13,808 - INFO - Processing document 4_2024-06-20
2025-11-14 17:57:13,827 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 17:57:13,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\4_2024-05-07' --> 'data\processed_data\XOM\4_2024-05-07.md'
Converted 'data\edgar_documents\XOM\4_2024-05-28' --> 'data\processed_data\XOM\4_2024-05-28.md'
Converted 'data\edgar_documents\XOM\4_2024-05-29' --> 'data\processed_data\XOM\4_2024-05-29.md'
Converted 'data\edgar_documents\XOM\4_2024-06-20' --> 'data\processed_data\XOM\4_2024-06-20.md'


2025-11-14 17:57:13,866 - INFO - Going to convert document batch...
2025-11-14 17:57:13,867 - INFO - Processing document 4_2024-06-26
2025-11-14 17:57:13,888 - INFO - Finished converting document 4_2024-06-26 in 0.05 sec.
2025-11-14 17:57:13,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,928 - INFO - Going to convert document batch...
2025-11-14 17:57:13,929 - INFO - Processing document 4_2024-07-01
2025-11-14 17:57:13,946 - INFO - Finished converting document 4_2024-07-01 in 0.03 sec.
2025-11-14 17:57:13,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:13,987 - INFO - Going to convert document batch...
2025-11-14 17:57:13,987 - INFO - Processing document 4_2024-08-14
2025-11-14 17:57:14,007 - INFO - Finished converting document 4_2024-08-14 in 0.03 sec.
2025-11-14 17:57:14,045 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:14,046 - ERROR - Input document 4_2024-09-30 with format None does 

Converted 'data\edgar_documents\XOM\4_2024-06-26' --> 'data\processed_data\XOM\4_2024-06-26.md'
Converted 'data\edgar_documents\XOM\4_2024-07-01' --> 'data\processed_data\XOM\4_2024-07-01.md'
Converted 'data\edgar_documents\XOM\4_2024-08-14' --> 'data\processed_data\XOM\4_2024-08-14.md'
Error processing data\edgar_documents\XOM\4_2024-09-30: File format not allowed: data\edgar_documents\XOM\4_2024-09-30
Error processing data\edgar_documents\XOM\4_2024-10-07: File format not allowed: data\edgar_documents\XOM\4_2024-10-07


2025-11-14 17:57:14,100 - INFO - Finished converting document 4_2024-10-21 in 0.03 sec.
2025-11-14 17:57:14,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,159 - INFO - Going to convert document batch...
2025-11-14 17:57:14,160 - INFO - Processing document 4_2024-11-27
2025-11-14 17:57:14,186 - INFO - Finished converting document 4_2024-11-27 in 0.08 sec.
2025-11-14 17:57:14,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,225 - INFO - Going to convert document batch...
2025-11-14 17:57:14,227 - INFO - Processing document 4_2024-12-02
2025-11-14 17:57:14,246 - INFO - Finished converting document 4_2024-12-02 in 0.05 sec.
2025-11-14 17:57:14,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,287 - INFO - Going to convert document batch...
2025-11-14 17:57:14,288 - INFO - Processing document 4_2024-12-16
2025-11-14 17:57:14,305 - INFO - Finished converting document 4_2024-12-16 in 0.03 sec.


Converted 'data\edgar_documents\XOM\4_2024-10-21' --> 'data\processed_data\XOM\4_2024-10-21.md'
Converted 'data\edgar_documents\XOM\4_2024-11-27' --> 'data\processed_data\XOM\4_2024-11-27.md'
Converted 'data\edgar_documents\XOM\4_2024-12-02' --> 'data\processed_data\XOM\4_2024-12-02.md'


2025-11-14 17:57:14,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,347 - INFO - Going to convert document batch...
2025-11-14 17:57:14,348 - INFO - Processing document 4_2024-12-18
2025-11-14 17:57:14,375 - INFO - Finished converting document 4_2024-12-18 in 0.05 sec.
2025-11-14 17:57:14,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,435 - INFO - Going to convert document batch...
2025-11-14 17:57:14,435 - INFO - Processing document 4_2025-01-03
2025-11-14 17:57:14,454 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 17:57:14,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,496 - INFO - Going to convert document batch...
2025-11-14 17:57:14,497 - INFO - Processing document 4_2025-02-03
2025-11-14 17:57:14,514 - INFO - Finished converting document 4_2025-02-03 in 0.05 sec.


Converted 'data\edgar_documents\XOM\4_2024-12-16' --> 'data\processed_data\XOM\4_2024-12-16.md'
Converted 'data\edgar_documents\XOM\4_2024-12-18' --> 'data\processed_data\XOM\4_2024-12-18.md'
Converted 'data\edgar_documents\XOM\4_2025-01-03' --> 'data\processed_data\XOM\4_2025-01-03.md'


2025-11-14 17:57:14,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,554 - INFO - Going to convert document batch...
2025-11-14 17:57:14,555 - INFO - Processing document 4_2025-02-05
2025-11-14 17:57:14,579 - INFO - Finished converting document 4_2025-02-05 in 0.05 sec.
2025-11-14 17:57:14,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,637 - INFO - Going to convert document batch...
2025-11-14 17:57:14,638 - INFO - Processing document 4_2025-03-18
2025-11-14 17:57:14,671 - INFO - Finished converting document 4_2025-03-18 in 0.08 sec.
2025-11-14 17:57:14,708 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:14,708 - ERROR - Input document 4_2025-03-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\XOM\4_2025-02-03' --> 'data\processed_data\XOM\4_2025-02-03.md'
Converted 'data\edgar_documents\XOM\4_2025-02-05' --> 'data\processed_data\XOM\4_2025-02-05.md'
Converted 'data\edgar_documents\XOM\4_2025-03-18' --> 'data\processed_data\XOM\4_2025-03-18.md'
Error processing data\edgar_documents\XOM\4_2025-03-24: File format not allowed: data\edgar_documents\XOM\4_2025-03-24


2025-11-14 17:57:14,726 - ERROR - Input document 4_2025-03-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57:14,727 - INFO - Going to convert document batch...
2025-11-14 17:57:14,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,747 - INFO - Going to convert document batch...
2025-11-14 17:57:14,748 - INFO - Processing document 4_2025-05-01
2025-11-14 17:57:14,764 - INFO - Finished converting document 4_2025-05-01 in 0.05 sec.
2025-11-14 17:57:14,797 - INFO - detec

Error processing data\edgar_documents\XOM\4_2025-03-31: File format not allowed: data\edgar_documents\XOM\4_2025-03-31
Converted 'data\edgar_documents\XOM\4_2025-05-01' --> 'data\processed_data\XOM\4_2025-05-01.md'
Converted 'data\edgar_documents\XOM\4_2025-05-06' --> 'data\processed_data\XOM\4_2025-05-06.md'
Converted 'data\edgar_documents\XOM\4_2025-08-25' --> 'data\processed_data\XOM\4_2025-08-25.md'


2025-11-14 17:57:14,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:14,944 - INFO - Going to convert document batch...
2025-11-14 17:57:14,944 - INFO - Processing document 4_2025-11-04
2025-11-14 17:57:14,963 - INFO - Finished converting document 4_2025-11-04 in 0.06 sec.
2025-11-14 17:57:15,016 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:15,016 - ERROR - Input document 4_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57

Converted 'data\edgar_documents\XOM\4_2025-11-04' --> 'data\processed_data\XOM\4_2025-11-04.md'
Error processing data\edgar_documents\XOM\4_2025-11-05: File format not allowed: data\edgar_documents\XOM\4_2025-11-05
Converted 'data\edgar_documents\XOM\8-K_2023-01-04' --> 'data\processed_data\XOM\8-K_2023-01-04.md'
Converted 'data\edgar_documents\XOM\8-K_2023-01-26' --> 'data\processed_data\XOM\8-K_2023-01-26.md'


2025-11-14 17:57:15,184 - INFO - Finished converting document 8-K_2023-01-31 in 0.06 sec.
2025-11-14 17:57:15,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,221 - INFO - Going to convert document batch...
2025-11-14 17:57:15,221 - INFO - Processing document 8-K_2023-02-24
2025-11-14 17:57:15,240 - INFO - Finished converting document 8-K_2023-02-24 in 0.05 sec.
2025-11-14 17:57:15,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,282 - INFO - Going to convert document batch...
2025-11-14 17:57:15,282 - INFO - Processing document 8-K_2023-04-04
2025-11-14 17:57:15,302 - INFO - Finished converting document 8-K_2023-04-04 in 0.05 sec.
2025-11-14 17:57:15,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,343 - INFO - Going to convert document batch...
2025-11-14 17:57:15,344 - INFO - Processing document 8-K_2023-04-28
2025-11-14 17:57:15,365 - INFO - Finished converting document 8-K_2023-04-28 in 0.

Converted 'data\edgar_documents\XOM\8-K_2023-01-31' --> 'data\processed_data\XOM\8-K_2023-01-31.md'
Converted 'data\edgar_documents\XOM\8-K_2023-02-24' --> 'data\processed_data\XOM\8-K_2023-02-24.md'
Converted 'data\edgar_documents\XOM\8-K_2023-04-04' --> 'data\processed_data\XOM\8-K_2023-04-04.md'


2025-11-14 17:57:15,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,439 - INFO - Going to convert document batch...
2025-11-14 17:57:15,440 - INFO - Processing document 8-K_2023-06-06
2025-11-14 17:57:15,534 - INFO - Finished converting document 8-K_2023-06-06 in 0.16 sec.


Converted 'data\edgar_documents\XOM\8-K_2023-04-28' --> 'data\processed_data\XOM\8-K_2023-04-28.md'


2025-11-14 17:57:15,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,628 - INFO - Going to convert document batch...
2025-11-14 17:57:15,629 - INFO - Processing document 8-K_2023-07-05
2025-11-14 17:57:15,648 - INFO - Finished converting document 8-K_2023-07-05 in 0.05 sec.
2025-11-14 17:57:15,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,688 - INFO - Going to convert document batch...
2025-11-14 17:57:15,689 - INFO - Processing document 8-K_2023-07-13
2025-11-14 17:57:15,723 - INFO - Finished converting document 8-K_2023-07-13 in 0.06 sec.
2025-11-14 17:57:15,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,776 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\XOM\8-K_2023-06-06' --> 'data\processed_data\XOM\8-K_2023-06-06.md'
Converted 'data\edgar_documents\XOM\8-K_2023-07-05' --> 'data\processed_data\XOM\8-K_2023-07-05.md'
Converted 'data\edgar_documents\XOM\8-K_2023-07-13' --> 'data\processed_data\XOM\8-K_2023-07-13.md'


2025-11-14 17:57:15,777 - INFO - Processing document 8-K_2023-07-28
2025-11-14 17:57:15,798 - INFO - Finished converting document 8-K_2023-07-28 in 0.05 sec.
2025-11-14 17:57:15,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,841 - INFO - Going to convert document batch...
2025-11-14 17:57:15,842 - INFO - Processing document 8-K_2023-10-04
2025-11-14 17:57:15,863 - INFO - Finished converting document 8-K_2023-10-04 in 0.05 sec.
2025-11-14 17:57:15,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:15,904 - INFO - Going to convert document batch...
2025-11-14 17:57:15,904 - INFO - Processing document 8-K_2023-10-11
2025-11-14 17:57:15,948 - INFO - Finished converting document 8-K_2023-10-11 in 0.08 sec.


Converted 'data\edgar_documents\XOM\8-K_2023-07-28' --> 'data\processed_data\XOM\8-K_2023-07-28.md'
Converted 'data\edgar_documents\XOM\8-K_2023-10-04' --> 'data\processed_data\XOM\8-K_2023-10-04.md'
Converted 'data\edgar_documents\XOM\8-K_2023-10-11' --> 'data\processed_data\XOM\8-K_2023-10-11.md'


2025-11-14 17:57:16,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,036 - INFO - Going to convert document batch...
2025-11-14 17:57:16,037 - INFO - Processing document 8-K_2023-10-20
2025-11-14 17:57:16,055 - INFO - Finished converting document 8-K_2023-10-20 in 0.06 sec.
2025-11-14 17:57:16,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,096 - INFO - Going to convert document batch...
2025-11-14 17:57:16,097 - INFO - Processing document 8-K_2023-10-27
2025-11-14 17:57:16,120 - INFO - Finished converting document 8-K_2023-10-27 in 0.06 sec.
2025-11-14 17:57:16,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,155 - INFO - Going to convert document batch...
2025-11-14 17:57:16,156 - INFO - Processing document 8-K_2023-11-02
2025-11-14 17:57:16,173 - INFO - Finished converting document 8-K_2023-11-02 in 0.05 sec.
2025-11-14 17:57:16,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\XOM\8-K_2023-10-20' --> 'data\processed_data\XOM\8-K_2023-10-20.md'
Converted 'data\edgar_documents\XOM\8-K_2023-10-27' --> 'data\processed_data\XOM\8-K_2023-10-27.md'
Converted 'data\edgar_documents\XOM\8-K_2023-11-02' --> 'data\processed_data\XOM\8-K_2023-11-02.md'
Converted 'data\edgar_documents\XOM\8-K_2023-11-07' --> 'data\processed_data\XOM\8-K_2023-11-07.md'


2025-11-14 17:57:16,265 - INFO - Going to convert document batch...
2025-11-14 17:57:16,266 - INFO - Processing document 8-K_2023-11-15
2025-11-14 17:57:16,282 - INFO - Finished converting document 8-K_2023-11-15 in 0.05 sec.
2025-11-14 17:57:16,309 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,323 - INFO - Going to convert document batch...
2025-11-14 17:57:16,324 - INFO - Processing document 8-K_2023-12-06
2025-11-14 17:57:16,355 - INFO - Finished converting document 8-K_2023-12-06 in 0.06 sec.
2025-11-14 17:57:16,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,437 - INFO - Going to convert document batch...
2025-11-14 17:57:16,439 - INFO - Processing document 8-K_2024-01-04
2025-11-14 17:57:16,470 - INFO - Finished converting document 8-K_2024-01-04 in 0.08 sec.


Converted 'data\edgar_documents\XOM\8-K_2023-11-15' --> 'data\processed_data\XOM\8-K_2023-11-15.md'
Converted 'data\edgar_documents\XOM\8-K_2023-12-06' --> 'data\processed_data\XOM\8-K_2023-12-06.md'


2025-11-14 17:57:16,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,505 - INFO - Going to convert document batch...
2025-11-14 17:57:16,505 - INFO - Processing document 8-K_2024-02-02
2025-11-14 17:57:16,527 - INFO - Finished converting document 8-K_2024-02-02 in 0.05 sec.
2025-11-14 17:57:16,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,565 - INFO - Going to convert document batch...
2025-11-14 17:57:16,566 - INFO - Processing document 8-K_2024-02-28
2025-11-14 17:57:16,587 - INFO - Finished converting document 8-K_2024-02-28 in 0.05 sec.
2025-11-14 17:57:16,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,624 - INFO - Going to convert document batch...
2025-11-14 17:57:16,624 - INFO - Processing document 8-K_2024-04-03
2025-11-14 17:57:16,645 - INFO - Finished converting document 8-K_2024-04-03 in 0.05 sec.
2025-11-14 17:57:16,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\8-K_2024-01-04' --> 'data\processed_data\XOM\8-K_2024-01-04.md'
Converted 'data\edgar_documents\XOM\8-K_2024-02-02' --> 'data\processed_data\XOM\8-K_2024-02-02.md'
Converted 'data\edgar_documents\XOM\8-K_2024-02-28' --> 'data\processed_data\XOM\8-K_2024-02-28.md'
Converted 'data\edgar_documents\XOM\8-K_2024-04-03' --> 'data\processed_data\XOM\8-K_2024-04-03.md'


2025-11-14 17:57:16,677 - INFO - Going to convert document batch...
2025-11-14 17:57:16,678 - INFO - Processing document 8-K_2024-04-26
2025-11-14 17:57:16,699 - INFO - Finished converting document 8-K_2024-04-26 in 0.05 sec.
2025-11-14 17:57:16,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,742 - INFO - Going to convert document batch...
2025-11-14 17:57:16,743 - INFO - Processing document 8-K_2024-05-03
2025-11-14 17:57:16,783 - INFO - Finished converting document 8-K_2024-05-03 in 0.08 sec.
2025-11-14 17:57:16,844 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,862 - INFO - Going to convert document batch...
2025-11-14 17:57:16,863 - INFO - Processing document 8-K_2024-05-10
2025-11-14 17:57:16,887 - INFO - Finished converting document 8-K_2024-05-10 in 0.08 sec.


Converted 'data\edgar_documents\XOM\8-K_2024-04-26' --> 'data\processed_data\XOM\8-K_2024-04-26.md'
Converted 'data\edgar_documents\XOM\8-K_2024-05-03' --> 'data\processed_data\XOM\8-K_2024-05-03.md'


2025-11-14 17:57:16,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:16,941 - INFO - Going to convert document batch...
2025-11-14 17:57:16,941 - INFO - Processing document 8-K_2024-05-31
2025-11-14 17:57:16,993 - INFO - Finished converting document 8-K_2024-05-31 in 0.08 sec.
2025-11-14 17:57:17,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,042 - INFO - Going to convert document batch...
2025-11-14 17:57:17,043 - INFO - Processing document 8-K_2024-07-08
2025-11-14 17:57:17,063 - INFO - Finished converting document 8-K_2024-07-08 in 0.05 sec.
2025-11-14 17:57:17,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,093 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\XOM\8-K_2024-05-10' --> 'data\processed_data\XOM\8-K_2024-05-10.md'
Converted 'data\edgar_documents\XOM\8-K_2024-05-31' --> 'data\processed_data\XOM\8-K_2024-05-31.md'
Converted 'data\edgar_documents\XOM\8-K_2024-07-08' --> 'data\processed_data\XOM\8-K_2024-07-08.md'


2025-11-14 17:57:17,094 - INFO - Processing document 8-K_2024-08-01
2025-11-14 17:57:17,109 - INFO - Finished converting document 8-K_2024-08-01 in 0.03 sec.
2025-11-14 17:57:17,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\XOM\8-K_2024-08-01' --> 'data\processed_data\XOM\8-K_2024-08-01.md'


2025-11-14 17:57:17,384 - INFO - Going to convert document batch...
2025-11-14 17:57:17,387 - INFO - Processing document 8-K_2024-08-02
2025-11-14 17:57:17,407 - INFO - Finished converting document 8-K_2024-08-02 in 0.28 sec.
2025-11-14 17:57:17,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,445 - INFO - Going to convert document batch...
2025-11-14 17:57:17,446 - INFO - Processing document 8-K_2024-10-03
2025-11-14 17:57:17,469 - INFO - Finished converting document 8-K_2024-10-03 in 0.05 sec.
2025-11-14 17:57:17,492 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,505 - INFO - Going to convert document batch...
2025-11-14 17:57:17,506 - INFO - Processing document 8-K_2024-10-08
2025-11-14 17:57:17,528 - INFO - Finished converting document 8-K_2024-10-08 in 0.06 sec.
2025-11-14 17:57:17,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,563 - INFO - Going to convert document batch...
2025-11-14 17:

Converted 'data\edgar_documents\XOM\8-K_2024-08-02' --> 'data\processed_data\XOM\8-K_2024-08-02.md'
Converted 'data\edgar_documents\XOM\8-K_2024-10-03' --> 'data\processed_data\XOM\8-K_2024-10-03.md'
Converted 'data\edgar_documents\XOM\8-K_2024-10-08' --> 'data\processed_data\XOM\8-K_2024-10-08.md'
Converted 'data\edgar_documents\XOM\8-K_2024-10-18' --> 'data\processed_data\XOM\8-K_2024-10-18.md'


2025-11-14 17:57:17,615 - INFO - Processing document 8-K_2024-11-01
2025-11-14 17:57:17,635 - INFO - Finished converting document 8-K_2024-11-01 in 0.05 sec.
2025-11-14 17:57:17,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,675 - INFO - Going to convert document batch...
2025-11-14 17:57:17,676 - INFO - Processing document 8-K_2024-11-12
2025-11-14 17:57:17,693 - INFO - Finished converting document 8-K_2024-11-12 in 0.05 sec.
2025-11-14 17:57:17,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,729 - INFO - Going to convert document batch...
2025-11-14 17:57:17,729 - INFO - Processing document 8-K_2025-01-07
2025-11-14 17:57:17,749 - INFO - Finished converting document 8-K_2025-01-07 in 0.05 sec.
2025-11-14 17:57:17,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,782 - INFO - Going to convert document batch...
2025-11-14 17:57:17,783 - INFO - Processing document 8-K_2025-01-31
2025-11-14 17:

Converted 'data\edgar_documents\XOM\8-K_2024-11-01' --> 'data\processed_data\XOM\8-K_2024-11-01.md'
Converted 'data\edgar_documents\XOM\8-K_2024-11-12' --> 'data\processed_data\XOM\8-K_2024-11-12.md'
Converted 'data\edgar_documents\XOM\8-K_2025-01-07' --> 'data\processed_data\XOM\8-K_2025-01-07.md'
Converted 'data\edgar_documents\XOM\8-K_2025-01-31' --> 'data\processed_data\XOM\8-K_2025-01-31.md'


2025-11-14 17:57:17,837 - INFO - Going to convert document batch...
2025-11-14 17:57:17,838 - INFO - Processing document 8-K_2025-04-01
2025-11-14 17:57:17,862 - INFO - Finished converting document 8-K_2025-04-01 in 0.05 sec.
2025-11-14 17:57:17,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,912 - INFO - Going to convert document batch...
2025-11-14 17:57:17,915 - INFO - Processing document 8-K_2025-04-03
2025-11-14 17:57:17,950 - INFO - Finished converting document 8-K_2025-04-03 in 0.08 sec.
2025-11-14 17:57:17,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:17,995 - INFO - Going to convert document batch...
2025-11-14 17:57:17,996 - INFO - Processing document 8-K_2025-05-02
2025-11-14 17:57:18,018 - INFO - Finished converting document 8-K_2025-05-02 in 0.05 sec.
2025-11-14 17:57:18,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:18,061 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\XOM\8-K_2025-04-01' --> 'data\processed_data\XOM\8-K_2025-04-01.md'
Converted 'data\edgar_documents\XOM\8-K_2025-04-03' --> 'data\processed_data\XOM\8-K_2025-04-03.md'
Converted 'data\edgar_documents\XOM\8-K_2025-05-02' --> 'data\processed_data\XOM\8-K_2025-05-02.md'


2025-11-14 17:57:18,062 - INFO - Processing document 8-K_2025-05-30
2025-11-14 17:57:18,099 - INFO - Finished converting document 8-K_2025-05-30 in 0.06 sec.
2025-11-14 17:57:18,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:18,142 - INFO - Going to convert document batch...
2025-11-14 17:57:18,143 - INFO - Processing document 8-K_2025-07-07
2025-11-14 17:57:18,163 - INFO - Finished converting document 8-K_2025-07-07 in 0.05 sec.
2025-11-14 17:57:18,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:18,195 - INFO - Going to convert document batch...
2025-11-14 17:57:18,196 - INFO - Processing document 8-K_2025-08-01
2025-11-14 17:57:18,215 - INFO - Finished converting document 8-K_2025-08-01 in 0.05 sec.
2025-11-14 17:57:18,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:18,251 - INFO - Going to convert document batch...
2025-11-14 17:57:18,252 - INFO - Processing document 8-K_2025-10-06
2025-11-14 17:

Converted 'data\edgar_documents\XOM\8-K_2025-05-30' --> 'data\processed_data\XOM\8-K_2025-05-30.md'
Converted 'data\edgar_documents\XOM\8-K_2025-07-07' --> 'data\processed_data\XOM\8-K_2025-07-07.md'
Converted 'data\edgar_documents\XOM\8-K_2025-08-01' --> 'data\processed_data\XOM\8-K_2025-08-01.md'
Converted 'data\edgar_documents\XOM\8-K_2025-10-06' --> 'data\processed_data\XOM\8-K_2025-10-06.md'


2025-11-14 17:57:18,303 - INFO - Going to convert document batch...
2025-11-14 17:57:18,304 - INFO - Processing document 8-K_2025-10-31
2025-11-14 17:57:18,326 - INFO - Finished converting document 8-K_2025-10-31 in 0.05 sec.
2025-11-14 17:57:18,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 17:57:18,382 - INFO - Going to convert document batch...
2025-11-14 17:57:18,383 - INFO - Processing document 8-K_2025-11-03
2025-11-14 17:57:18,406 - INFO - Finished converting document 8-K_2025-11-03 in 0.06 sec.
2025-11-14 17:57:18,466 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:18,467 - ERROR - Input document DEF-14A_2023-04-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\XOM\8-K_2025-10-31' --> 'data\processed_data\XOM\8-K_2025-10-31.md'
Converted 'data\edgar_documents\XOM\8-K_2025-11-03' --> 'data\processed_data\XOM\8-K_2025-11-03.md'
Error processing data\edgar_documents\XOM\DEF-14A_2023-04-13: File format not allowed: data\edgar_documents\XOM\DEF-14A_2023-04-13


2025-11-14 17:57:18,527 - ERROR - Input document DEF-14A_2024-04-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 17:57:18,529 - INFO - Going to convert document batch...
2025-11-14 17:57:18,562 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 17:57:18,563 - ERROR - Input document DEF-14A_2025-04-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\XOM\DEF-14A_2024-04-11: File format not allowed: data\edgar_documents\XOM\DEF-14A_2024-04-11
Error processing data\edgar_documents\XOM\DEF-14A_2025-04-07: File format not allowed: data\edgar_documents\XOM\DEF-14A_2025-04-07
Processed 96 new files. Errors: 24


In [3]:
# Convert the Reuters news files to Markdown.
# Unlike the EDGAR cell, which loops over per-ticker sub-folders, this cell
# passes the news directory straight to process_files in a single call.
# process_files skips any input whose .md output already exists, so
# re-running this cell only converts files that are still missing.
import os  # not referenced in this cell

crawl_dir = 'data/reuters_news'
processed_dir = 'data/processed_data/company_news'

process_files(crawl_dir=crawl_dir, processed_dir=processed_dir)

2025-11-24 11:24:32,131 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:32,154 - INFO - Going to convert document batch...
2025-11-24 11:24:32,157 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-24 11:24:32,223 - INFO - Loading plugin 'docling_defaults'
2025-11-24 11:24:32,228 - INFO - Registered picture descriptions: ['vlm', 'api']
2025-11-24 11:24:32,229 - INFO - Processing document AAPL.csv
2025-11-24 11:24:32,230 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:32,249 - INFO - Detected 7435 lines


Found 97 files to process in data\reuters_news


2025-11-24 11:24:32,539 - INFO - Finished converting document AAPL.csv in 0.45 sec.
2025-11-24 11:24:37,759 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:37,761 - INFO - Going to convert document batch...
2025-11-24 11:24:37,762 - INFO - Processing document ABBV.csv
2025-11-24 11:24:37,763 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:37,764 - INFO - Detected 457 lines
2025-11-24 11:24:37,772 - INFO - Finished converting document ABBV.csv in 0.03 sec.


Converted 'data\reuters_news\AAPL.csv' --> 'data\processed_data\company_news\AAPL.md'


2025-11-24 11:24:37,978 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:37,979 - INFO - Going to convert document batch...
2025-11-24 11:24:37,980 - INFO - Processing document ABT.csv
2025-11-24 11:24:37,980 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:37,982 - INFO - Detected 369 lines
2025-11-24 11:24:37,990 - INFO - Finished converting document ABT.csv in 0.03 sec.
2025-11-24 11:24:38,140 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:38,142 - INFO - Going to convert document batch...
2025-11-24 11:24:38,143 - INFO - Processing document ACN.csv
2025-11-24 11:24:38,143 - INFO - Parsing CSV with delimiter: ","


Converted 'data\reuters_news\ABBV.csv' --> 'data\processed_data\company_news\ABBV.md'
Converted 'data\reuters_news\ABT.csv' --> 'data\processed_data\company_news\ABT.md'


2025-11-24 11:24:38,144 - INFO - Detected 190 lines
2025-11-24 11:24:38,148 - INFO - Finished converting document ACN.csv in 0.05 sec.
2025-11-24 11:24:38,248 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:38,249 - INFO - Going to convert document batch...
2025-11-24 11:24:38,250 - INFO - Processing document ADBE.csv
2025-11-24 11:24:38,250 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:38,252 - INFO - Detected 283 lines
2025-11-24 11:24:38,259 - INFO - Finished converting document ADBE.csv in 0.05 sec.
2025-11-24 11:24:38,388 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:38,390 - INFO - Going to convert document batch...
2025-11-24 11:24:38,391 - INFO - Processing document AIG.csv
2025-11-24 11:24:38,392 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:38,393 - INFO - Detected 167 lines
2025-11-24 11:24:38,397 - INFO - Finished converting document AIG.csv in 0.03 sec.


Converted 'data\reuters_news\ACN.csv' --> 'data\processed_data\company_news\ACN.md'
Converted 'data\reuters_news\ADBE.csv' --> 'data\processed_data\company_news\ADBE.md'


2025-11-24 11:24:38,483 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:38,488 - INFO - Going to convert document batch...
2025-11-24 11:24:38,489 - INFO - Processing document AMD.csv
2025-11-24 11:24:38,490 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:38,493 - INFO - Detected 1065 lines
2025-11-24 11:24:38,513 - INFO - Finished converting document AMD.csv in 0.05 sec.


Converted 'data\reuters_news\AIG.csv' --> 'data\processed_data\company_news\AIG.md'


2025-11-24 11:24:38,885 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:38,886 - INFO - Going to convert document batch...
2025-11-24 11:24:38,887 - INFO - Processing document AMGN.csv
2025-11-24 11:24:38,887 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:38,888 - INFO - Detected 350 lines
2025-11-24 11:24:38,894 - INFO - Finished converting document AMGN.csv in 0.03 sec.
2025-11-24 11:24:39,056 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]


Converted 'data\reuters_news\AMD.csv' --> 'data\processed_data\company_news\AMD.md'
Converted 'data\reuters_news\AMGN.csv' --> 'data\processed_data\company_news\AMGN.md'


2025-11-24 11:24:39,058 - INFO - Going to convert document batch...
2025-11-24 11:24:39,060 - INFO - Processing document AMT.csv
2025-11-24 11:24:39,061 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:39,063 - INFO - Detected 62 lines
2025-11-24 11:24:39,066 - INFO - Finished converting document AMT.csv in 0.06 sec.
2025-11-24 11:24:39,115 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:39,119 - INFO - Going to convert document batch...
2025-11-24 11:24:39,120 - INFO - Processing document AMZN.csv
2025-11-24 11:24:39,121 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:39,125 - INFO - Detected 1201 lines


Converted 'data\reuters_news\AMT.csv' --> 'data\processed_data\company_news\AMT.md'


2025-11-24 11:24:39,292 - INFO - Finished converting document AMZN.csv in 0.19 sec.
2025-11-24 11:24:40,208 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:40,211 - INFO - Going to convert document batch...
2025-11-24 11:24:40,211 - INFO - Processing document AVGO.csv
2025-11-24 11:24:40,212 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:40,214 - INFO - Detected 564 lines
2025-11-24 11:24:40,225 - INFO - Finished converting document AVGO.csv in 0.03 sec.


Converted 'data\reuters_news\AMZN.csv' --> 'data\processed_data\company_news\AMZN.md'


2025-11-24 11:24:40,435 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:40,436 - INFO - Going to convert document batch...
2025-11-24 11:24:40,438 - INFO - Processing document AXP.csv
2025-11-24 11:24:40,438 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:40,440 - INFO - Detected 317 lines
2025-11-24 11:24:40,446 - INFO - Finished converting document AXP.csv in 0.03 sec.
2025-11-24 11:24:40,602 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]


Converted 'data\reuters_news\AVGO.csv' --> 'data\processed_data\company_news\AVGO.md'
Converted 'data\reuters_news\AXP.csv' --> 'data\processed_data\company_news\AXP.md'


2025-11-24 11:24:40,628 - INFO - Going to convert document batch...
2025-11-24 11:24:40,629 - INFO - Processing document BA.csv
2025-11-24 11:24:40,630 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:40,642 - INFO - Detected 4817 lines
2025-11-24 11:24:40,730 - INFO - Finished converting document BA.csv in 0.17 sec.
2025-11-24 11:24:43,247 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:43,255 - INFO - Going to convert document batch...
2025-11-24 11:24:43,256 - INFO - Processing document BAC.csv
2025-11-24 11:24:43,257 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:43,264 - INFO - Detected 2331 lines
2025-11-24 11:24:43,311 - INFO - Finished converting document BAC.csv in 0.08 sec.


Converted 'data\reuters_news\BA.csv' --> 'data\processed_data\company_news\BA.md'


2025-11-24 11:24:44,307 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:44,308 - INFO - Going to convert document batch...
2025-11-24 11:24:44,309 - INFO - Processing document BK.csv
2025-11-24 11:24:44,309 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:44,310 - INFO - Detected 293 lines
2025-11-24 11:24:44,315 - INFO - Finished converting document BK.csv in 0.01 sec.
2025-11-24 11:24:44,441 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:44,443 - INFO - Going to convert document batch...
2025-11-24 11:24:44,444 - INFO - Processing document BKNG.csv
2025-11-24 11:24:44,444 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:44,446 - INFO - Detected 171 lines
2025-11-24 11:24:44,449 - INFO - Finished converting document BKNG.csv in 0.03 sec.


Converted 'data\reuters_news\BAC.csv' --> 'data\processed_data\company_news\BAC.md'
Converted 'data\reuters_news\BK.csv' --> 'data\processed_data\company_news\BK.md'


2025-11-24 11:24:44,518 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:44,525 - INFO - Going to convert document batch...
2025-11-24 11:24:44,528 - INFO - Processing document BLK.csv
2025-11-24 11:24:44,529 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:44,533 - INFO - Detected 1811 lines
2025-11-24 11:24:44,567 - INFO - Finished converting document BLK.csv in 0.08 sec.


Converted 'data\reuters_news\BKNG.csv' --> 'data\processed_data\company_news\BKNG.md'


2025-11-24 11:24:45,806 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:45,812 - INFO - Going to convert document batch...
2025-11-24 11:24:45,813 - INFO - Processing document BMY.csv
2025-11-24 11:24:45,814 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:45,817 - INFO - Detected 413 lines
2025-11-24 11:24:45,837 - INFO - Finished converting document BMY.csv in 0.06 sec.


Converted 'data\reuters_news\BLK.csv' --> 'data\processed_data\company_news\BLK.md'


2025-11-24 11:24:46,048 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:46,056 - INFO - Going to convert document batch...
2025-11-24 11:24:46,058 - INFO - Processing document BRK.B.csv
2025-11-24 11:24:46,060 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:46,067 - INFO - Detected 870 lines
2025-11-24 11:24:46,102 - INFO - Finished converting document BRK.B.csv in 0.11 sec.


Converted 'data\reuters_news\BMY.csv' --> 'data\processed_data\company_news\BMY.md'


2025-11-24 11:24:46,647 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:46,661 - INFO - Going to convert document batch...
2025-11-24 11:24:46,662 - INFO - Processing document C.csv
2025-11-24 11:24:46,663 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:46,672 - INFO - Detected 3025 lines
2025-11-24 11:24:46,728 - INFO - Finished converting document C.csv in 0.12 sec.


Converted 'data\reuters_news\BRK.B.csv' --> 'data\processed_data\company_news\BRK.B.md'


2025-11-24 11:24:47,959 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:47,961 - INFO - Going to convert document batch...
2025-11-24 11:24:47,961 - INFO - Processing document CAT.csv
2025-11-24 11:24:47,962 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:47,963 - INFO - Detected 348 lines
2025-11-24 11:24:47,969 - INFO - Finished converting document CAT.csv in 0.05 sec.


Converted 'data\reuters_news\C.csv' --> 'data\processed_data\company_news\C.md'
Converted 'data\reuters_news\CAT.csv' --> 'data\processed_data\company_news\CAT.md'


2025-11-24 11:24:48,175 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:48,176 - INFO - Going to convert document batch...
2025-11-24 11:24:48,177 - INFO - Processing document CHTR.csv
2025-11-24 11:24:48,177 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:48,178 - INFO - Detected 118 lines
2025-11-24 11:24:48,180 - INFO - Finished converting document CHTR.csv in 0.06 sec.
2025-11-24 11:24:48,235 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:48,237 - INFO - Going to convert document batch...
2025-11-24 11:24:48,238 - INFO - Processing document CL.csv
2025-11-24 11:24:48,239 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:48,240 - INFO - Detected 98 lines
2025-11-24 11:24:48,242 - INFO - Finished converting document CL.csv in 0.03 sec.
2025-11-24 11:24:48,294 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:48,297 - INFO - Going to convert document batch...
2025-11-24 11:24:48,297 - INFO - Processi

Converted 'data\reuters_news\CHTR.csv' --> 'data\processed_data\company_news\CHTR.md'
Converted 'data\reuters_news\CL.csv' --> 'data\processed_data\company_news\CL.md'


2025-11-24 11:24:48,786 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:48,789 - INFO - Going to convert document batch...
2025-11-24 11:24:48,790 - INFO - Processing document COF.csv
2025-11-24 11:24:48,790 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:48,792 - INFO - Detected 162 lines
2025-11-24 11:24:48,795 - INFO - Finished converting document COF.csv in 0.02 sec.
2025-11-24 11:24:48,884 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:48,886 - INFO - Going to convert document batch...
2025-11-24 11:24:48,887 - INFO - Processing document COST.csv
2025-11-24 11:24:48,889 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:48,890 - INFO - Detected 273 lines
2025-11-24 11:24:48,896 - INFO - Finished converting document COST.csv in 0.03 sec.


Converted 'data\reuters_news\CMCSA.csv' --> 'data\processed_data\company_news\CMCSA.md'
Converted 'data\reuters_news\COF.csv' --> 'data\processed_data\company_news\COF.md'


2025-11-24 11:24:49,026 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,028 - INFO - Going to convert document batch...
2025-11-24 11:24:49,028 - INFO - Processing document CRM.csv
2025-11-24 11:24:49,029 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,030 - INFO - Detected 410 lines
2025-11-24 11:24:49,037 - INFO - Finished converting document CRM.csv in 0.05 sec.


Converted 'data\reuters_news\COST.csv' --> 'data\processed_data\company_news\COST.md'
Converted 'data\reuters_news\CRM.csv' --> 'data\processed_data\company_news\CRM.md'


2025-11-24 11:24:49,242 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,244 - INFO - Going to convert document batch...
2025-11-24 11:24:49,244 - INFO - Processing document CSCO.csv
2025-11-24 11:24:49,245 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,247 - INFO - Detected 363 lines
2025-11-24 11:24:49,253 - INFO - Finished converting document CSCO.csv in 0.05 sec.
2025-11-24 11:24:49,405 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,408 - INFO - Going to convert document batch...
2025-11-24 11:24:49,409 - INFO - Processing document CVS.csv
2025-11-24 11:24:49,410 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,411 - INFO - Detected 614 lines
2025-11-24 11:24:49,422 - INFO - Finished converting document CVS.csv in 0.05 sec.


Converted 'data\reuters_news\CSCO.csv' --> 'data\processed_data\company_news\CSCO.md'


2025-11-24 11:24:49,672 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,673 - INFO - Going to convert document batch...
2025-11-24 11:24:49,674 - INFO - Processing document DE.csv
2025-11-24 11:24:49,675 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,676 - INFO - Detected 190 lines
2025-11-24 11:24:49,679 - INFO - Finished converting document DE.csv in 0.03 sec.
2025-11-24 11:24:49,793 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,795 - INFO - Going to convert document batch...
2025-11-24 11:24:49,795 - INFO - Processing document DHR.csv
2025-11-24 11:24:49,796 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,796 - INFO - Detected 99 lines
2025-11-24 11:24:49,799 - INFO - Finished converting document DHR.csv in 0.05 sec.


Converted 'data\reuters_news\CVS.csv' --> 'data\processed_data\company_news\CVS.md'
Converted 'data\reuters_news\DE.csv' --> 'data\processed_data\company_news\DE.md'
Converted 'data\reuters_news\DHR.csv' --> 'data\processed_data\company_news\DHR.md'


2025-11-24 11:24:49,872 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:49,887 - INFO - Going to convert document batch...
2025-11-24 11:24:49,889 - INFO - Processing document DIS.csv
2025-11-24 11:24:49,892 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:49,899 - INFO - Detected 2060 lines
2025-11-24 11:24:49,964 - INFO - Finished converting document DIS.csv in 0.14 sec.
2025-11-24 11:24:51,935 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:51,937 - INFO - Going to convert document batch...
2025-11-24 11:24:51,937 - INFO - Processing document DUK.csv
2025-11-24 11:24:51,938 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:51,938 - INFO - Detected 135 lines
2025-11-24 11:24:51,941 - INFO - Finished converting document DUK.csv in 0.05 sec.
2025-11-24 11:24:52,017 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:52,018 - INFO - Going to convert document batch...
2025-11-24 11:24:52,019 - INFO - Proces

Converted 'data\reuters_news\DIS.csv' --> 'data\processed_data\company_news\DIS.md'
Converted 'data\reuters_news\DUK.csv' --> 'data\processed_data\company_news\DUK.md'
Converted 'data\reuters_news\EMR.csv' --> 'data\processed_data\company_news\EMR.md'


2025-11-24 11:24:52,356 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:52,358 - INFO - Going to convert document batch...
2025-11-24 11:24:52,359 - INFO - Processing document GD.csv
2025-11-24 11:24:52,360 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:52,362 - INFO - Detected 292 lines
2025-11-24 11:24:52,371 - INFO - Finished converting document GD.csv in 0.03 sec.
2025-11-24 11:24:52,517 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:52,521 - INFO - Going to convert document batch...


Converted 'data\reuters_news\FDX.csv' --> 'data\processed_data\company_news\FDX.md'
Converted 'data\reuters_news\GD.csv' --> 'data\processed_data\company_news\GD.md'


2025-11-24 11:24:52,522 - INFO - Processing document GE.csv
2025-11-24 11:24:52,523 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:52,526 - INFO - Detected 915 lines
2025-11-24 11:24:52,544 - INFO - Finished converting document GE.csv in 0.05 sec.
2025-11-24 11:24:52,928 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:24:52,930 - INFO - Going to convert document batch...
2025-11-24 11:24:52,930 - INFO - Processing document GILD.csv
2025-11-24 11:24:52,931 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:52,932 - INFO - Detected 390 lines
2025-11-24 11:24:52,939 - INFO - Finished converting document GILD.csv in 0.03 sec.
2025-11-24 11:24:53,099 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]


Converted 'data\reuters_news\GE.csv' --> 'data\processed_data\company_news\GE.md'
Converted 'data\reuters_news\GILD.csv' --> 'data\processed_data\company_news\GILD.md'


2025-11-24 11:24:53,117 - INFO - Going to convert document batch...
2025-11-24 11:24:53,118 - INFO - Processing document GOOGL.csv
2025-11-24 11:24:53,120 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:24:53,143 - INFO - Detected 7623 lines
2025-11-24 11:24:53,423 - INFO - Finished converting document GOOGL.csv in 0.34 sec.
2025-11-24 11:25:01,141 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:01,153 - INFO - Going to convert document batch...
2025-11-24 11:25:01,154 - INFO - Processing document GS.csv
2025-11-24 11:25:01,155 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:01,166 - INFO - Detected 4043 lines
2025-11-24 11:25:01,410 - INFO - Finished converting document GS.csv in 0.30 sec.


Converted 'data\reuters_news\GOOGL.csv' --> 'data\processed_data\company_news\GOOGL.md'


2025-11-24 11:25:03,288 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:03,289 - INFO - Going to convert document batch...
2025-11-24 11:25:03,290 - INFO - Processing document HD.csv
2025-11-24 11:25:03,290 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:03,292 - INFO - Detected 430 lines
2025-11-24 11:25:03,299 - INFO - Finished converting document HD.csv in 0.02 sec.
2025-11-24 11:25:03,469 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]


Converted 'data\reuters_news\GS.csv' --> 'data\processed_data\company_news\GS.md'
Converted 'data\reuters_news\HD.csv' --> 'data\processed_data\company_news\HD.md'


2025-11-24 11:25:03,471 - INFO - Going to convert document batch...
2025-11-24 11:25:03,472 - INFO - Processing document HON.csv
2025-11-24 11:25:03,472 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:03,473 - INFO - Detected 292 lines
2025-11-24 11:25:03,478 - INFO - Finished converting document HON.csv in 0.03 sec.
2025-11-24 11:25:03,742 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:03,745 - INFO - Going to convert document batch...
2025-11-24 11:25:03,745 - INFO - Processing document IBM.csv
2025-11-24 11:25:03,746 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:03,747 - INFO - Detected 524 lines
2025-11-24 11:25:03,757 - INFO - Finished converting document IBM.csv in 0.03 sec.


Converted 'data\reuters_news\HON.csv' --> 'data\processed_data\company_news\HON.md'


2025-11-24 11:25:03,995 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:04,003 - INFO - Going to convert document batch...
2025-11-24 11:25:04,003 - INFO - Processing document INTC.csv
2025-11-24 11:25:04,004 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:04,009 - INFO - Detected 1941 lines
2025-11-24 11:25:04,049 - INFO - Finished converting document INTC.csv in 0.08 sec.


Converted 'data\reuters_news\IBM.csv' --> 'data\processed_data\company_news\IBM.md'


2025-11-24 11:25:04,945 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:04,946 - INFO - Going to convert document batch...
2025-11-24 11:25:04,947 - INFO - Processing document INTU.csv
2025-11-24 11:25:04,947 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:04,949 - INFO - Detected 76 lines
2025-11-24 11:25:04,951 - INFO - Finished converting document INTU.csv in 0.02 sec.
2025-11-24 11:25:05,013 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:05,016 - INFO - Going to convert document batch...
2025-11-24 11:25:05,017 - INFO - Processing document ISRG.csv
2025-11-24 11:25:05,018 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:05,020 - INFO - Detected 55 lines
2025-11-24 11:25:05,024 - INFO - Finished converting document ISRG.csv in 0.03 sec.
2025-11-24 11:25:05,076 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:05,089 - INFO - Going to convert document batch...
2025-11-24 11:25:05,090 - INFO - Proce

Converted 'data\reuters_news\INTC.csv' --> 'data\processed_data\company_news\INTC.md'
Converted 'data\reuters_news\INTU.csv' --> 'data\processed_data\company_news\INTU.md'
Converted 'data\reuters_news\ISRG.csv' --> 'data\processed_data\company_news\ISRG.md'


2025-11-24 11:25:05,135 - INFO - Finished converting document JNJ.csv in 0.08 sec.
2025-11-24 11:25:06,183 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:06,195 - INFO - Going to convert document batch...
2025-11-24 11:25:06,197 - INFO - Processing document JPM.csv
2025-11-24 11:25:06,198 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:06,212 - INFO - Detected 4211 lines
2025-11-24 11:25:06,291 - INFO - Finished converting document JPM.csv in 0.12 sec.


Converted 'data\reuters_news\JNJ.csv' --> 'data\processed_data\company_news\JNJ.md'


2025-11-24 11:25:08,432 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:08,435 - INFO - Going to convert document batch...
2025-11-24 11:25:08,436 - INFO - Processing document KO.csv
2025-11-24 11:25:08,436 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:08,438 - INFO - Detected 592 lines
2025-11-24 11:25:08,448 - INFO - Finished converting document KO.csv in 0.03 sec.


Converted 'data\reuters_news\JPM.csv' --> 'data\processed_data\company_news\JPM.md'


2025-11-24 11:25:08,694 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:08,696 - INFO - Going to convert document batch...
2025-11-24 11:25:08,699 - INFO - Processing document LIN.csv
2025-11-24 11:25:08,700 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:08,701 - INFO - Detected 103 lines
2025-11-24 11:25:08,703 - INFO - Finished converting document LIN.csv in 0.02 sec.
2025-11-24 11:25:08,757 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:08,762 - INFO - Going to convert document batch...
2025-11-24 11:25:08,765 - INFO - Processing document LLY.csv
2025-11-24 11:25:08,766 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:08,770 - INFO - Detected 1561 lines
2025-11-24 11:25:08,800 - INFO - Finished converting document LLY.csv in 0.08 sec.


Converted 'data\reuters_news\KO.csv' --> 'data\processed_data\company_news\KO.md'
Converted 'data\reuters_news\LIN.csv' --> 'data\processed_data\company_news\LIN.md'


2025-11-24 11:25:09,447 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:09,451 - INFO - Going to convert document batch...
2025-11-24 11:25:09,451 - INFO - Processing document LMT.csv
2025-11-24 11:25:09,452 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:09,455 - INFO - Detected 1231 lines
2025-11-24 11:25:09,476 - INFO - Finished converting document LMT.csv in 0.05 sec.


Converted 'data\reuters_news\LLY.csv' --> 'data\processed_data\company_news\LLY.md'


2025-11-24 11:25:10,020 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:10,022 - INFO - Going to convert document batch...
2025-11-24 11:25:10,022 - INFO - Processing document LOW.csv
2025-11-24 11:25:10,023 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:10,024 - INFO - Detected 221 lines
2025-11-24 11:25:10,028 - INFO - Finished converting document LOW.csv in 0.02 sec.
2025-11-24 11:25:10,123 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:10,126 - INFO - Going to convert document batch...
2025-11-24 11:25:10,126 - INFO - Processing document MA.csv
2025-11-24 11:25:10,127 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:10,129 - INFO - Detected 558 lines
2025-11-24 11:25:10,275 - INFO - Finished converting document MA.csv in 0.17 sec.


Converted 'data\reuters_news\LMT.csv' --> 'data\processed_data\company_news\LMT.md'
Converted 'data\reuters_news\LOW.csv' --> 'data\processed_data\company_news\LOW.md'


2025-11-24 11:25:10,503 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:10,508 - INFO - Going to convert document batch...
2025-11-24 11:25:10,508 - INFO - Processing document MCD.csv
2025-11-24 11:25:10,509 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:10,511 - INFO - Detected 814 lines
2025-11-24 11:25:10,526 - INFO - Finished converting document MCD.csv in 0.05 sec.


Converted 'data\reuters_news\MA.csv' --> 'data\processed_data\company_news\MA.md'


2025-11-24 11:25:10,879 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:10,880 - INFO - Going to convert document batch...
2025-11-24 11:25:10,881 - INFO - Processing document MDLZ.csv
2025-11-24 11:25:10,881 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:10,883 - INFO - Detected 261 lines
2025-11-24 11:25:10,888 - INFO - Finished converting document MDLZ.csv in 0.03 sec.
2025-11-24 11:25:11,003 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:11,004 - INFO - Going to convert document batch...
2025-11-24 11:25:11,005 - INFO - Processing document MDT.csv
2025-11-24 11:25:11,005 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:11,006 - INFO - Detected 132 lines
2025-11-24 11:25:11,009 - INFO - Finished converting document MDT.csv in 0.03 sec.


Converted 'data\reuters_news\MCD.csv' --> 'data\processed_data\company_news\MCD.md'
Converted 'data\reuters_news\MDLZ.csv' --> 'data\processed_data\company_news\MDLZ.md'


2025-11-24 11:25:11,087 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:11,089 - INFO - Going to convert document batch...
2025-11-24 11:25:11,089 - INFO - Processing document MET.csv
2025-11-24 11:25:11,090 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:11,090 - INFO - Detected 72 lines
2025-11-24 11:25:11,093 - INFO - Finished converting document MET.csv in 0.02 sec.
2025-11-24 11:25:11,135 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:11,149 - INFO - Going to convert document batch...
2025-11-24 11:25:11,150 - INFO - Processing document META.csv
2025-11-24 11:25:11,150 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:11,162 - INFO - Detected 5077 lines
2025-11-24 11:25:11,248 - INFO - Finished converting document META.csv in 0.12 sec.


Converted 'data\reuters_news\MDT.csv' --> 'data\processed_data\company_news\MDT.md'
Converted 'data\reuters_news\MET.csv' --> 'data\processed_data\company_news\MET.md'


2025-11-24 11:25:14,089 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:14,090 - INFO - Going to convert document batch...
2025-11-24 11:25:14,091 - INFO - Processing document MMM.csv
2025-11-24 11:25:14,091 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:14,093 - INFO - Detected 285 lines
2025-11-24 11:25:14,098 - INFO - Finished converting document MMM.csv in 0.03 sec.
2025-11-24 11:25:14,241 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:14,241 - INFO - Going to convert document batch...
2025-11-24 11:25:14,243 - INFO - Processing document MO.csv
2025-11-24 11:25:14,244 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:14,244 - INFO - Detected 152 lines
2025-11-24 11:25:14,247 - INFO - Finished converting document MO.csv in 0.03 sec.


Converted 'data\reuters_news\META.csv' --> 'data\processed_data\company_news\META.md'
Converted 'data\reuters_news\MMM.csv' --> 'data\processed_data\company_news\MMM.md'


2025-11-24 11:25:14,315 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:14,319 - INFO - Going to convert document batch...
2025-11-24 11:25:14,320 - INFO - Processing document MRK.csv
2025-11-24 11:25:14,320 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:14,323 - INFO - Detected 1010 lines
2025-11-24 11:25:14,341 - INFO - Finished converting document MRK.csv in 0.05 sec.


Converted 'data\reuters_news\MO.csv' --> 'data\processed_data\company_news\MO.md'


2025-11-24 11:25:14,893 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:14,901 - INFO - Going to convert document batch...
2025-11-24 11:25:14,902 - INFO - Processing document MS.csv
2025-11-24 11:25:14,902 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:14,909 - INFO - Detected 2314 lines
2025-11-24 11:25:14,952 - INFO - Finished converting document MS.csv in 0.08 sec.


Converted 'data\reuters_news\MRK.csv' --> 'data\processed_data\company_news\MRK.md'


2025-11-24 11:25:15,929 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:15,952 - INFO - Going to convert document batch...
2025-11-24 11:25:15,953 - INFO - Processing document MSFT.csv
2025-11-24 11:25:15,953 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:15,969 - INFO - Detected 6444 lines


Converted 'data\reuters_news\MS.csv' --> 'data\processed_data\company_news\MS.md'


2025-11-24 11:25:16,234 - INFO - Finished converting document MSFT.csv in 0.31 sec.
2025-11-24 11:25:20,132 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:20,134 - INFO - Going to convert document batch...
2025-11-24 11:25:20,134 - INFO - Processing document NEE.csv
2025-11-24 11:25:20,135 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:20,136 - INFO - Detected 177 lines
2025-11-24 11:25:20,139 - INFO - Finished converting document NEE.csv in 0.02 sec.
2025-11-24 11:25:20,246 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:20,252 - INFO - Going to convert document batch...
2025-11-24 11:25:20,252 - INFO - Processing document NFLX.csv
2025-11-24 11:25:20,253 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:20,258 - INFO - Detected 2039 lines


Converted 'data\reuters_news\MSFT.csv' --> 'data\processed_data\company_news\MSFT.md'
Converted 'data\reuters_news\NEE.csv' --> 'data\processed_data\company_news\NEE.md'


2025-11-24 11:25:20,296 - INFO - Finished converting document NFLX.csv in 0.08 sec.
2025-11-24 11:25:21,857 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:21,861 - INFO - Going to convert document batch...
2025-11-24 11:25:21,862 - INFO - Processing document NKE.csv
2025-11-24 11:25:21,862 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:21,865 - INFO - Detected 879 lines
2025-11-24 11:25:21,881 - INFO - Finished converting document NKE.csv in 0.05 sec.


Converted 'data\reuters_news\NFLX.csv' --> 'data\processed_data\company_news\NFLX.md'


2025-11-24 11:25:22,247 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:22,248 - INFO - Going to convert document batch...
2025-11-24 11:25:22,249 - INFO - Processing document NOW.csv
2025-11-24 11:25:22,249 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:22,250 - INFO - Detected 64 lines
2025-11-24 11:25:22,252 - INFO - Finished converting document NOW.csv in 0.02 sec.
2025-11-24 11:25:22,291 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:22,303 - INFO - Going to convert document batch...
2025-11-24 11:25:22,304 - INFO - Processing document NVDA.csv
2025-11-24 11:25:22,304 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:22,315 - INFO - Detected 4582 lines
2025-11-24 11:25:22,392 - INFO - Finished converting document NVDA.csv in 0.11 sec.


Converted 'data\reuters_news\NKE.csv' --> 'data\processed_data\company_news\NKE.md'
Converted 'data\reuters_news\NOW.csv' --> 'data\processed_data\company_news\NOW.md'


2025-11-24 11:25:26,464 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:26,466 - INFO - Going to convert document batch...
2025-11-24 11:25:26,467 - INFO - Processing document ORCL.csv
2025-11-24 11:25:26,467 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:26,469 - INFO - Detected 815 lines
2025-11-24 11:25:26,483 - INFO - Finished converting document ORCL.csv in 0.03 sec.


Converted 'data\reuters_news\NVDA.csv' --> 'data\processed_data\company_news\NVDA.md'


2025-11-24 11:25:26,822 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:26,825 - INFO - Going to convert document batch...
2025-11-24 11:25:26,826 - INFO - Processing document PEP.csv
2025-11-24 11:25:26,827 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:26,828 - INFO - Detected 591 lines
2025-11-24 11:25:26,838 - INFO - Finished converting document PEP.csv in 0.05 sec.


Converted 'data\reuters_news\ORCL.csv' --> 'data\processed_data\company_news\ORCL.md'


2025-11-24 11:25:27,072 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:27,089 - INFO - Going to convert document batch...
2025-11-24 11:25:27,090 - INFO - Processing document PFE.csv
2025-11-24 11:25:27,091 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:27,105 - INFO - Detected 5219 lines


Converted 'data\reuters_news\PEP.csv' --> 'data\processed_data\company_news\PEP.md'


2025-11-24 11:25:27,346 - INFO - Finished converting document PFE.csv in 0.28 sec.
2025-11-24 11:25:30,171 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:30,173 - INFO - Going to convert document batch...
2025-11-24 11:25:30,174 - INFO - Processing document PG.csv
2025-11-24 11:25:30,175 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:30,176 - INFO - Detected 101 lines
2025-11-24 11:25:30,179 - INFO - Finished converting document PG.csv in 0.03 sec.
2025-11-24 11:25:30,268 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:30,270 - INFO - Going to convert document batch...
2025-11-24 11:25:30,271 - INFO - Processing document PLTR.csv
2025-11-24 11:25:30,271 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:30,273 - INFO - Detected 294 lines
2025-11-24 11:25:30,279 - INFO - Finished converting document PLTR.csv in 0.05 sec.


Converted 'data\reuters_news\PFE.csv' --> 'data\processed_data\company_news\PFE.md'
Converted 'data\reuters_news\PG.csv' --> 'data\processed_data\company_news\PG.md'


2025-11-24 11:25:30,412 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:30,414 - INFO - Going to convert document batch...
2025-11-24 11:25:30,415 - INFO - Processing document PM.csv
2025-11-24 11:25:30,415 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:30,417 - INFO - Detected 252 lines
2025-11-24 11:25:30,424 - INFO - Finished converting document PM.csv in 0.02 sec.
2025-11-24 11:25:30,553 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:30,556 - INFO - Going to convert document batch...
2025-11-24 11:25:30,557 - INFO - Processing document PYPL.csv
2025-11-24 11:25:30,558 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:30,559 - INFO - Detected 497 lines
2025-11-24 11:25:30,567 - INFO - Finished converting document PYPL.csv in 0.03 sec.


Converted 'data\reuters_news\PLTR.csv' --> 'data\processed_data\company_news\PLTR.md'
Converted 'data\reuters_news\PM.csv' --> 'data\processed_data\company_news\PM.md'


2025-11-24 11:25:30,817 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:30,821 - INFO - Going to convert document batch...
2025-11-24 11:25:30,821 - INFO - Processing document QCOM.csv
2025-11-24 11:25:30,822 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:30,825 - INFO - Detected 888 lines
2025-11-24 11:25:30,841 - INFO - Finished converting document QCOM.csv in 0.05 sec.


Converted 'data\reuters_news\PYPL.csv' --> 'data\processed_data\company_news\PYPL.md'


2025-11-24 11:25:31,223 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:31,225 - INFO - Going to convert document batch...
2025-11-24 11:25:31,226 - INFO - Processing document RTX.csv
2025-11-24 11:25:31,227 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:31,230 - INFO - Detected 521 lines
2025-11-24 11:25:31,239 - INFO - Finished converting document RTX.csv in 0.06 sec.


Converted 'data\reuters_news\QCOM.csv' --> 'data\processed_data\company_news\QCOM.md'


2025-11-24 11:25:31,447 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:31,450 - INFO - Going to convert document batch...
2025-11-24 11:25:31,451 - INFO - Processing document SBUX.csv
2025-11-24 11:25:31,452 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:31,456 - INFO - Detected 801 lines
2025-11-24 11:25:31,470 - INFO - Finished converting document SBUX.csv in 0.03 sec.


Converted 'data\reuters_news\RTX.csv' --> 'data\processed_data\company_news\RTX.md'


2025-11-24 11:25:31,835 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:31,836 - INFO - Going to convert document batch...
2025-11-24 11:25:31,837 - INFO - Processing document SCHW.csv
2025-11-24 11:25:31,838 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:31,839 - INFO - Detected 240 lines
2025-11-24 11:25:31,843 - INFO - Finished converting document SCHW.csv in 0.02 sec.
2025-11-24 11:25:31,949 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:31,949 - INFO - Going to convert document batch...
2025-11-24 11:25:31,950 - INFO - Processing document SO.csv
2025-11-24 11:25:31,951 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:31,951 - INFO - Detected 88 lines
2025-11-24 11:25:31,953 - INFO - Finished converting document SO.csv in 0.02 sec.
2025-11-24 11:25:31,991 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:31,992 - INFO - Going to convert document batch...
2025-11-24 11:25:31,993 - INFO - Processi

Converted 'data\reuters_news\SBUX.csv' --> 'data\processed_data\company_news\SBUX.md'
Converted 'data\reuters_news\SCHW.csv' --> 'data\processed_data\company_news\SCHW.md'
Converted 'data\reuters_news\SO.csv' --> 'data\processed_data\company_news\SO.md'


2025-11-24 11:25:32,037 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:32,041 - INFO - Going to convert document batch...
2025-11-24 11:25:32,041 - INFO - Processing document T.csv
2025-11-24 11:25:32,042 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:32,045 - INFO - Detected 887 lines
2025-11-24 11:25:32,061 - INFO - Finished converting document T.csv in 0.03 sec.


Converted 'data\reuters_news\SPG.csv' --> 'data\processed_data\company_news\SPG.md'


2025-11-24 11:25:32,606 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:32,610 - INFO - Going to convert document batch...
2025-11-24 11:25:32,611 - INFO - Processing document TGT.csv
2025-11-24 11:25:32,611 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:32,614 - INFO - Detected 988 lines
2025-11-24 11:25:32,630 - INFO - Finished converting document TGT.csv in 0.08 sec.


Converted 'data\reuters_news\T.csv' --> 'data\processed_data\company_news\T.md'


2025-11-24 11:25:33,073 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:33,075 - INFO - Going to convert document batch...
2025-11-24 11:25:33,075 - INFO - Processing document TMO.csv
2025-11-24 11:25:33,076 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:33,076 - INFO - Detected 174 lines
2025-11-24 11:25:33,079 - INFO - Finished converting document TMO.csv in 0.02 sec.
2025-11-24 11:25:33,184 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:33,188 - INFO - Going to convert document batch...
2025-11-24 11:25:33,189 - INFO - Processing document TMUS.csv
2025-11-24 11:25:33,190 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:33,192 - INFO - Detected 417 lines
2025-11-24 11:25:33,201 - INFO - Finished converting document TMUS.csv in 0.06 sec.


Converted 'data\reuters_news\TGT.csv' --> 'data\processed_data\company_news\TGT.md'
Converted 'data\reuters_news\TMO.csv' --> 'data\processed_data\company_news\TMO.md'


2025-11-24 11:25:33,373 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:33,396 - INFO - Going to convert document batch...
2025-11-24 11:25:33,397 - INFO - Processing document TSLA.csv
2025-11-24 11:25:33,398 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:33,418 - INFO - Detected 8548 lines


Converted 'data\reuters_news\TMUS.csv' --> 'data\processed_data\company_news\TMUS.md'


2025-11-24 11:25:33,725 - INFO - Finished converting document TSLA.csv in 0.38 sec.
2025-11-24 11:25:40,134 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:40,136 - INFO - Going to convert document batch...
2025-11-24 11:25:40,137 - INFO - Processing document TXN.csv
2025-11-24 11:25:40,138 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:40,139 - INFO - Detected 207 lines
2025-11-24 11:25:40,143 - INFO - Finished converting document TXN.csv in 0.02 sec.
2025-11-24 11:25:40,252 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:40,256 - INFO - Going to convert document batch...
2025-11-24 11:25:40,257 - INFO - Processing document UNH.csv
2025-11-24 11:25:40,257 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:40,260 - INFO - Detected 711 lines
2025-11-24 11:25:40,276 - INFO - Finished converting document UNH.csv in 0.05 sec.


Converted 'data\reuters_news\TSLA.csv' --> 'data\processed_data\company_news\TSLA.md'
Converted 'data\reuters_news\TXN.csv' --> 'data\processed_data\company_news\TXN.md'


2025-11-24 11:25:40,564 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:40,566 - INFO - Going to convert document batch...
2025-11-24 11:25:40,566 - INFO - Processing document UNP.csv
2025-11-24 11:25:40,567 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:40,568 - INFO - Detected 244 lines
2025-11-24 11:25:40,573 - INFO - Finished converting document UNP.csv in 0.03 sec.
2025-11-24 11:25:40,699 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:40,701 - INFO - Going to convert document batch...
2025-11-24 11:25:40,701 - INFO - Processing document UPS.csv
2025-11-24 11:25:40,702 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:40,704 - INFO - Detected 555 lines
2025-11-24 11:25:40,715 - INFO - Finished converting document UPS.csv in 0.05 sec.


Converted 'data\reuters_news\UNH.csv' --> 'data\processed_data\company_news\UNH.md'
Converted 'data\reuters_news\UNP.csv' --> 'data\processed_data\company_news\UNP.md'


2025-11-24 11:25:40,959 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:40,961 - INFO - Going to convert document batch...
2025-11-24 11:25:40,962 - INFO - Processing document USB.csv
2025-11-24 11:25:40,962 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:40,963 - INFO - Detected 181 lines
2025-11-24 11:25:40,966 - INFO - Finished converting document USB.csv in 0.03 sec.
2025-11-24 11:25:41,070 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:41,075 - INFO - Going to convert document batch...
2025-11-24 11:25:41,075 - INFO - Processing document V.csv
2025-11-24 11:25:41,076 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:41,078 - INFO - Detected 590 lines
2025-11-24 11:25:41,090 - INFO - Finished converting document V.csv in 0.05 sec.


Converted 'data\reuters_news\UPS.csv' --> 'data\processed_data\company_news\UPS.md'
Converted 'data\reuters_news\USB.csv' --> 'data\processed_data\company_news\USB.md'


2025-11-24 11:25:41,333 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:41,336 - INFO - Going to convert document batch...
2025-11-24 11:25:41,337 - INFO - Processing document VZ.csv
2025-11-24 11:25:41,338 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:41,340 - INFO - Detected 650 lines
2025-11-24 11:25:41,355 - INFO - Finished converting document VZ.csv in 0.05 sec.


Converted 'data\reuters_news\V.csv' --> 'data\processed_data\company_news\V.md'


2025-11-24 11:25:41,650 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:41,654 - INFO - Going to convert document batch...
2025-11-24 11:25:41,655 - INFO - Processing document WFC.csv
2025-11-24 11:25:41,656 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:41,659 - INFO - Detected 701 lines
2025-11-24 11:25:41,674 - INFO - Finished converting document WFC.csv in 0.06 sec.


Converted 'data\reuters_news\VZ.csv' --> 'data\processed_data\company_news\VZ.md'


2025-11-24 11:25:42,099 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:42,107 - INFO - Going to convert document batch...
2025-11-24 11:25:42,108 - INFO - Processing document WMT.csv
2025-11-24 11:25:42,109 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:42,115 - INFO - Detected 2585 lines
2025-11-24 11:25:42,161 - INFO - Finished converting document WMT.csv in 0.08 sec.


Converted 'data\reuters_news\WFC.csv' --> 'data\processed_data\company_news\WFC.md'


2025-11-24 11:25:43,520 - INFO - detected formats: [<InputFormat.CSV: 'csv'>]
2025-11-24 11:25:43,522 - INFO - Going to convert document batch...
2025-11-24 11:25:43,523 - INFO - Processing document XOM.csv
2025-11-24 11:25:43,524 - INFO - Parsing CSV with delimiter: ","
2025-11-24 11:25:43,524 - INFO - Detected 45 lines
2025-11-24 11:25:43,526 - INFO - Finished converting document XOM.csv in 0.03 sec.


Converted 'data\reuters_news\WMT.csv' --> 'data\processed_data\company_news\WMT.md'
Converted 'data\reuters_news\XOM.csv' --> 'data\processed_data\company_news\XOM.md'
Processed 97 new files. Errors: 0
